%%% -*-BibTeX-*-
%%% ====================================================================
%%%  BibTeX-file{
%%%     author          = "Nelson H. F. Beebe",
%%%     version         = "1.17",
%%%     date            = "12 April 2024",
%%%     time            = "09:42:59 MST",
%%%     filename        = "ieeeacmtaslp.bib",
%%%     address         = "University of Utah
%%%                        Department of Mathematics, 110 LCB
%%%                        155 S 1400 E RM 233a
%%%                        Salt Lake City, UT 84112-0090
%%%                        USA",
%%%     telephone       = "+1 801 581 5254",
%%%     FAX             = "+1 801 581 4148",
%%%     URL             = "https://www.math.utah.edu/~beebe",
%%%     checksum        = "50257 65862 250970 2818881",
%%%     email           = "beebe at math.utah.edu, beebe at acm.org,
%%%                        beebe at computer.org (Internet)",
%%%     codetable       = "ISO/ASCII",
%%%     keywords        = "bibliography; BibTeX; IEEE/ACM Transactions
%%%                        on Audio, Speech, and Language Processing",
%%%     license         = "public domain",
%%%     supported       = "yes",
%%%     docstring       = "This is a COMPLETE bibliography of the
%%%                        journal IEEE/ACM Transactions on Audio,
%%%                        Speech, and Language Processing (CODEN none,
%%%                        ISSN 2329-9290). The journal began publishing
%%%                        in 2014 as the merger of the journals ACM
%%%                        Transactions on Speech and Language
%%%                        Processing (TSLP) (2004--2013) and IEEE
%%%                        Transactions on Audio, Speech, and Language
%%%                        Processing (2006--2013).  The initial volume
%%%                        of the merged journal is 22, continuing the
%%%                        numbering of the IEEE parent journal.
%%%                        The journal has a Web site at
%%%
%%%                            https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655
%%%
%%%                        At version 1.17, the COMPLETE journal
%%%                        coverage looked like this:
%%%                             2014 ( 298)    2018 ( 276)    2022 ( 121)
%%%                             2015 ( 292)    2019 ( 209)    2023 ( 311)
%%%                             2016 ( 265)    2020 (  60)    2024 ( 155)
%%%                             2017 ( 275)    2021 ( 292)
%%%                             Article:       2554
%%%                             Total entries: 2554
%%%                        The checksum field above contains a CRC-16
%%%                        checksum as the first value, followed by the
%%%                        equivalent of the standard UNIX wc (word
%%%                        count) utility output of lines, words, and
%%%                        characters.  This is produced by Robert
%%%                        Solovay's checksum utility.",
%%%  }
%%% ====================================================================
%%% TeX definitions needed to typeset entries in this file.  Apart from
%%% the \input of bibnames.sty, each macro is defined only when it is
%%% not already defined, so document-level definitions take precedence.
@Preamble{
    "\input bibnames.sty" #
    "\ifx \undefined \dbar \def \dbar {\leavevmode\raise0.2ex\hbox{--}\kern-0.5emd} \fi" #
    "\ifx \undefined \Dbar \def \Dbar {\leavevmode\raise0.2ex\hbox{--}\kern-0.5emD} \fi" #
    "\ifx \undefined \ocirc      \def \ocirc #1{{\accent'27#1}}\fi" #
    "\ifx \undefined \r          \def \r #1{\ocirc{#1}} \fi"
}

%%% ====================================================================
%%% Acknowledgement abbreviations:
@String{ack-nhfb = "Nelson H. F. Beebe,
                    University of Utah,
                    Department of Mathematics, 110 LCB,
                    155 S 1400 E RM 233,
                    Salt Lake City, UT 84112-0090, USA,
                    Tel: +1 801 581 5254,
                    FAX: +1 801 581 4148,
                    e-mail: \path|beebe@math.utah.edu|,
                            \path|beebe@acm.org|,
                            \path|beebe@computer.org| (Internet),
                    URL: \path|https://www.math.utah.edu/~beebe/|"}

%%% ====================================================================
%%% Journal abbreviations:
%%% Full journal title; the journal field of the entries below refers
%%% to this abbreviation.
@String{j-IEEE-ACM-TASLP =
    {IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}

%%% ====================================================================
%%% Bibliography entries, sorted in publication order:
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "1--2",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "3--4",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

%%% NOTE(review): this record is damaged.  The entry header (entry type
%%% and citation key) is missing, the author and title values end
%%% without a closing quote (their continuation lines appear to have
%%% been lost), and the final journal-URL line is malformed.  Restore the
%%% missing text from the publisher's table of contents for volume 22,
%%% number 1, page 5 before relying on this record.
  author =       "L. Deng and S. Renals and M. Federico and M.
  title =        "Editorial: Expanding the Technical Reach of our
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "5--5",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Taghia and R. Martin",
  title =        "Objective Intelligibility Measures Based on Mutual
                 Information for Speech Subjected to Speech Enhancement
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "6--16",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Liang Lu and A. Ghoshal and S. Renals",
  title =        "Cross-Lingual Subspace {Gaussian} Mixture Models for
                 Low-Resource Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "17--27",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Gasic and S. Young",
  title =        "{Gaussian} Processes for {POMDP}-Based Dialogue
                 Manager Optimization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "28--40",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "I. Mezghani-Marrakchi and G. Mahe and S. Djaziri-Larbi
                 and M. Jaidane and M. Turki-Hadj Alouane",
  title =        "Nonlinear Audio Systems Identification Through Audio
                 Input {Gaussianization}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "41--53",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. B. Crespo and R. C. Hendriks",
  title =        "Multizone Speech Reinforcement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "54--66",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chao Pan and Jingdong Chen and J. Benesty",
  title =        "Performance Study of the {MVDR} Beamformer as a
                 Function of the Source Incidence Angle",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "67--79",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hung-yi Lee and Lin-shan Lee",
  title =        "Improved Semantic Retrieval of Spoken Content by
                 Document\slash Query Expansion with Random Walk Over
                 Acoustic Similarity Graphs",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "80--94",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "V. Leutnant and A. Krueger and R. Haeb-Umbach",
  title =        "A New Observation Model in the Logarithmic Mel Power
                 Spectral Domain for the Automatic Recognition of Noisy
                 Reverberant Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "95--109",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "N. F. Chen and S. W. Tam and Wade Shen and J. P.
  title =        "Characterizing Phonetic Transformations and Acoustic
                 Differences Across {English} Dialects",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "110--124",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Markovic and K. Kowalczyk and F. Antonacci and C.
                 Hofmann and A. Sarti and W. Kellermann",
  title =        "Estimation of Acoustic Reflection Coefficients Through
                 Pseudospectrum Matching",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "125--137",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhiyao Duan and Jinyu Han and B. Pardo",
  title =        "Multi-pitch Streaming of Harmonic Sound Mixtures",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "138--150",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shilin Liu and Khe Chai Sim",
  title =        "Temporally Varying Weight Regression: A
                 Semi-Parametric Trajectory Model for Automatic Speech
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "151--160",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "V. S. Tomar and R. C. Rose",
  title =        "A Family of Discriminative Manifold Learning
                 Algorithms and Their Application to Speech
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "161--171",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Doi and T. Toda and K. Nakamura and H. Saruwatari
                 and K. Shikano",
  title =        "Alaryngeal Speech Enhancement Based on One-to-Many
                 Eigenvoice Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "172--183",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "E. Arisoy and S. F. Chen and B. Ramabhadran and A.
  title =        "Converting Neural Network Language Models into
                 Back-off Language Models for Efficient Decoding in
                 Automatic Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "184--192",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "C. T. Jin and N. Epain and A. Parthy",
  title =        "Design, Optimization and Evaluation of a Dual-Radius
                 Spherical Microphone Array",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "193--204",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. Mignot and G. Chardon and L. Daudet",
  title =        "Low Frequency Interpolation of Room Impulse Responses
                 Using Compressed Sensing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "205--216",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Senoussaoui and P. Kenny and T. Stafylakis and P.
  title =        "A Study of the Cosine Distance-Based Mean Shift for
                 Telephone Speech Diarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "217--227",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Tachibana and N. Ono and S. Sagayama",
  title =        "Singing Voice Enhancement in Monaural Music Signals
                 Based on Two-stage Harmonic\slash Percussive Sound
                 Separation on Multiple Resolution Spectrograms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "228--237",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "N. R. Shabtai and B. Rafaely",
  title =        "Generalized Spherical Array Beamforming for Binaural
                 Speech Reproduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "238--247",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Cumani and P. Laface",
  title =        "Factorized Sub-Space Estimation for Fast and Memory
                 Effective {$I$}-vector Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "248--259",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuan Zeng and R. C. Hendriks",
  title =        "Distributed Delay and Sum Beamformer for Speech
                 Enhancement via Randomized Gossip",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "260--273",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhenghua Li and Min Zhang and Wanxiang Che and Ting
                 Liu and Wenliang Chen",
  title =        "Joint Optimization for {Chinese} {POS} Tagging and
                 Dependency Parsing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "274--286",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing --- EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "289--290",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "291--292",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "293--293",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "B287--B288",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "C1",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "C2",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "C3",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "1",
  pages =        "C4",
  month =        jan,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "289--290",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "291--292",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dehong Gao and Wenjie Li and Xiaoyan Cai and Renxian
                 Zhang and You Ouyang",
  title =        "Sequential Summarization: a Full View of {Twitter}
                 Trending Topics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "293--302",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "P. W. J. van Hengel and J. D. Krijnders",
  title =        "A Comparison of Spectro-Temporal Representations of
                 Audio Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "303--313",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "I. Zitouni and Y. Benajiba",
  title =        "Aligned-Parallel-Corpora Based Semi-Supervised
                 Learning for {Arabic} Mention Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "314--324",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "E. Molina and A. M. Barbancho and L. J. Tardon and I.
  title =        "Dissonance Reduction In Polyphonic Audio Using
                 Harmonic Reorganization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "325--334",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. P. K. Lun and Tak-Wai Shen and K. C. Ho",
  title =        "A Novel Expectation-Maximization Framework for Speech
                 Enhancement in Non-Stationary Noise Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "335--346",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Cosentino and T. H. Falk and D. McAlpine and T.
  title =        "Cochlear Implant Filterbank Design and Optimization: A
                 Simulation Study",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "347--353",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Souden and K. Kinoshita and M. Delcroix and T.
  title =        "Location Feature Integration for Clustering-Based
                 Speech Separation in Distributed Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "354--367",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Kallasjoki and J. F. Gemmeke and K. J. Palomaki",
  title =        "Estimating Uncertainty to Improve Exemplar-Based
                 Feature Enhancement for Noise Robust Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "368--380",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Hasan and J. H. L. Hansen",
  title =        "Maximum Likelihood Acoustic Factor Analysis Models for
                 Robust Speaker Verification in Noise",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "381--391",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "O. Schwartz and S. Gannot",
  title =        "Speaker Tracking Using Recursive {EM} Algorithms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "392--402",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yu Tsao and S. Matsuda and C. Hori and H. Kashioka and
                 Chin-Hui Lee",
  title =        "A {MAP}-based Online Estimation Approach to Ensemble
                 Speaker and Speaking Environment Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "403--416",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Pui-Yu Hui and H. Meng",
  title =        "Latent Semantic Analysis for Multimodal User Input
                 With Speech and Gestures",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "417--429",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Jensen and C. H. Taal",
  title =        "Speech Intelligibility Prediction Based on Mutual
                 Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "430--440",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Primavera and S. Cecchi and Junfeng Li and F.
                 Piazza",
  title =        "Objective and Subjective Investigation on a Novel
                 Method for Digital Reverberator Parameters Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "441--452",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Speed and D. Murphy and D. Howard",
  title =        "Modeling the Vocal Tract Transfer Function Using a
                 {$3$D} Digital Waveguide Mesh",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "453--464",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H{\"u}seyim Hac{\i}habibo{\u{g}}lu",
  title =        "Theoretical Analysis of Open Spherical Microphone
                 Arrays for Acoustic Intensity Measurements",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "465--476",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Taemin Cho and J. P. Bello",
  title =        "On the Relative Importance of Individual Components of
                 Chord Recognition Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "477--492",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Otsuka and K. Ishiguro and H. Sawada and H. G.
                 Okuno",
  title =        "{Bayesian} Nonparametrics for Microphone Array
                 Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "493--504",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jianjun He and Ee-Leng Tan and Woon-Seng Gan",
  title =        "Linear Estimation Based Primary-Ambient Extraction for
                 Stereo Audio Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "505--517",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Gonzalez and M. Brookes",
  title =        "{PEFAC} --- A Pitch Estimation Algorithm Robust to
                 High Levels of Noise",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "518--530",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Min Zhang and Xiangyu Duan and Wenliang Chen",
  title =        "{Bayesian} Constituent Context Model for Grammar
                 Induction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "531--541",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dah-Chung Chang and Fei-Tao Chu",
  title =        "Feedforward Active Noise Control With a New Variable
                 Tap-Length and Step-Size Filtered-{X} {LMS} Algorithm",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "542--555",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. McVicar and R. Santos-Rodriguez and Yizhao Ni and
                 Tijl {De Bie}",
  title =        "Automatic Chord Estimation from Audio: a Review of the
                 State of the Art",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "556--575",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} --- {EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "576--577",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "578--579",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "580--580",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "C1",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "C2",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "C3",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "C4",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "581--582",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "583--584",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chung-Hsien Wu and Yi-Chin Huang and Chung-Han Lee and
                 Jun-Cheng Guo",
  title =        "Synthesis of Spontaneous Speech With Syllable
                 Contraction Using State-Based Context-Dependent Voice
                 Transformation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "585--595",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Airaksinen and T. Raitio and B. Story and P. Alku",
  title =        "Quasi Closed Phase Glottal Inverse Filtering Analysis
                 With Weighted Linear Prediction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "596--607",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jae-Mo Yang and Hong-Goo Kang",
  title =        "Online Speech Dereverberation Algorithm Based on
                 Adaptive Multichannel Linear Prediction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "608--619",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Asaei and M. Golbabaee and H. Bourlard and V.
                 Cevher",
  title =        "Structured Sparsity Models for Reverberant Speech
                 Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "620--633",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. S. Rashobh and A. W. H. Khong and Di Liu",
  title =        "Multichannel Equalization in the {KLT} and Frequency
                 Domains With Application to Speech Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "634--646",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "P. Samarasinghe and T. Abhayapala and M. Poletti",
  title =        "Wavefield Analysis Over Large Areas Using Distributed
                 Higher Order Microphones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "647--658",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wen-Li Wei and Chung-Hsien Wu and Jen-Chun Lin and Han
                 Li",
  title =        "Exploiting Psychological Factors for Interaction Style
                 Recognition in Spoken Conversation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "659--671",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. A. Raczy{\'n}ski and E. Vincent",
  title =        "Genre-Based Music Language Modeling with Latent
                 Hierarchical {Pitman}-Yor Process Allocation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "672--681",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dalei Wu and Wei-Ping Zhu and M. N. S. Swamy",
  title =        "The Theory of Compressive Sensing Matching Pursuit
                 Considering Time-domain Noise with Application to
                 Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "682--696",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Nanjundaswamy and K. Rose",
  title =        "Cascaded Long Term Prediction for Enhanced Compression
                 of Polyphonic Audio Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "697--710",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "K. Audhkhasi and A. M. Zavou and P. G. Georgiou and S.
                 S. Narayanan",
  title =        "Theoretical Analysis of Diversity in an Ensemble of
                 Automatic Speech Recognition Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "711--726",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Nikunen and T. Virtanen",
  title =        "Direction of Arrival Based Spatial Covariance Model
                 for Blind Sound Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "727--739",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "741--742",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "743--744",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "745--745",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Publish your article in {IEEE Access}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "746--746",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "B740",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "C1",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "C2",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "C3",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "C4",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "741--742",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "743--744",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jinyu Li and Li Deng and Yifan Gong and R.
                 Haeb-Umbach",
  title =        "An Overview of Noise-Robust Automatic Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "745--777",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. Sarikaya and G. E. Hinton and A. Deoras",
  title =        "Application of Deep Belief Networks for Natural
                 Language Understanding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "778--784",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. Serizel and M. Moonen and B. {Van Dijk} and J.
                 Wouters",
  title =        "Low-rank Approximation Based Multichannel {Wiener}
                 Filter Algorithms for Noise Reduction with Application
                 in Cochlear Implants",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "785--799",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Crocco and A. Trucco",
  title =        "Design of Superdirective Planar Arrays With Sparse
                 Aperiodic Layouts for Processing Broadband Signals via
                 {$3$-D} Beamforming",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "800--815",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. R. Zapata and M. E. P. Davies and E. Gomez",
  title =        "Multi-Feature Beat Tracking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "816--825",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Narayanan and Deliang Wang",
  title =        "Investigation of Speech Separation as a Front-End for
                 Noise Robust Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "826--835",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaojia Zhao and Yuxuan Wang and Deliang Wang",
  title =        "Robust Speaker Identification in Noisy and Reverberant
                 Conditions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "836--845",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Cumani and O. Plchot and P. Laface",
  title =        "On the use of $i$-vector posterior distributions in
                 Probabilistic Linear Discriminant Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "846--857",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chung-Hsien Wu and Han-Ping Shen and Yan-Ting Yang",
  title =        "{Chinese--English} Phone Set Construction for
                 Code-Switching {ASR} Using Acoustic and {DNN}-Extracted
                 Articulatory Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "858--862",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "863--864",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "865--866",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "867--867",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Publish your article in {IEEE Access}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "868--868",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "C1",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "C2",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "C3",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "4",
  pages =        "C4",
  month =        apr,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "869--870",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "871--872",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Weibin Zhang and P. Fung",
  title =        "Discriminatively Trained Sparse Inverse Covariance
                 Matrices for Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "873--882",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hung-yi Lee and Sz-Rung Shiang and Ching-Feng Yeh and
                 Yun-Nung Chen and Yu Huang and Sheng-Yi Kong and
                 Lin-shan Lee",
  title =        "Spoken Knowledge Organization by Semantic Structuring
                 and a Prototype Course Lecture System for Personalized
                 Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "883--898",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "L. Z{\~a}o and R. Coelho and P. Flandrin",
  title =        "Speech Enhancement with {EMD} and {Hurst}-Based Mode
                 Selection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "899--911",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Giacobello and M. G. Christensen and T. L. Jensen
                 and M. N. Murthi and S. H. Jensen and M. Moonen",
  title =        "Stable $1$-Norm Error Minimization Based Linear
                 Predictors for Speech Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "912--922",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Y. Lacouture-Parodi and E. A. P. Habets and Jingdong
                 Chen and J. Benesty",
  title =        "Multichannel Noise Reduction in the
                 {Karhunen--Lo{\`e}ve} Expansion Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "923--936",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. O. Sadjadi and J. H. L. Hansen",
  title =        "Blind Spectral Weighting for Robust Speaker
                 Identification under Reverberation Mismatch",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "937--945",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "G. Mantena and S. Achanta and K. Prahallad",
  title =        "Query-by-Example Spoken Term Detection using Frequency
                 Domain Linear Prediction and Non-Segmental Dynamic Time
                 Warping",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "946--955",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "C. Osterwise and S. L. Grant",
  title =        "On Over-Determined Frequency Domain {BSS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "956--966",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. P. Jarrett and M. Taseska and E. A. P. Habets and
                 P. A. Naylor",
  title =        "Noise Reduction in the Spherical Harmonic Domain Using
                 a Tradeoff Beamformer and Narrowband {DOA} Estimates",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "967--978",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "V. Rieser and O. Lemon and S. Keizer",
  title =        "Natural Language Generation as Incremental Planning
                 Under Uncertainty: Adaptive Information Presentation
                 for Statistical Dialogue Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "979--994",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Cheer and S. J. Elliott",
  title =        "Comments on {``Complete Parallel Narrowband Active
                 Noise Control Systems''}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "995--996",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "999--1000",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "1001--1002",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "B997--B998",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "C1",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "C2",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "C3",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "5",
  pages =        "C4",
  month =        may,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:37 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "999--1000",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "1001--1002",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "V. Arora and L. Behera",
  title =        "Musical Source Clustering and Identification in
                 Polyphonic Audio",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "1003--1012",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. C. Nongpiur",
  title =        "Design of Minimax Broadband Beamformers that are
                 Robust to Microphone Gain, Phase, and Position Errors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "1013--1022",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Venkitaraman and C. S. Seelamantula",
  title =        "Binaural Signal Processing Motivated Generalized
                 Analytic Signal Construction and {AM--FM}
                 Demodulation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "1023--1036",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. T. Geiger and F. Weninger and J. F. Gemmeke and M.
                 Wollmer and B. Schuller and G. Rigoll",
  title =        "Memory-Enhanced Neural Networks and {NMF} for Robust
                 {ASR}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "1037--1046",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Haiquan Zhao and Yi Yu and Shibin Gao and Xiangping
                 Zeng and Zhengyou He",
  title =        "Memory Proportionate {APA} with Individual Activation
                 Factors for Acoustic Echo Cancellation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "1047--1055",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. J. Gangeh and P. Fewzee and A. Ghodsi and M. S.
                 Kamel and F. Karray",
  title =        "Multiview Supervised Dictionary Learning in Speech
                 Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "1056--1068",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jae-Hun Choi and Joon-Hyuk Chang",
  title =        "Dual-Microphone Voice Activity Detection Technique
                 Based on Two-Step Power Level Difference Ratio",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "1069--1081",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "X. Alameda-Pineda and R. Horaud",
  title =        "A Geometric Approach to Sound Source Localization from
                 Time-Delay Estimates",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "1082--1095",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "K. Reindl and S. Meier and H. Barfuss and W.
                 Kellermann",
  title =        "Minimum Mutual Information-Based Linearly Constrained
                 Broadband Signal Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "1096--1108",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "1109--1110",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "1111--1112",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "C1",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "C2",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "C3",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "6",
  pages =        "C4",
  month =        jun,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1113--1114",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1115--1116",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. H. Bahari and N. Dehak and H. {Van hamme} and L.
                 Burget and A. M. Ali and J. Glass",
  title =        "Non-Negative Factor Analysis of {Gaussian} Mixture
                 Model Weight Adaptation for Language and Dialect
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1117--1129",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guangzhao Bao and Yangfei Xu and Zhongfu Ye",
  title =        "Learning a Discriminative Dictionary for
                 Single-Channel Speech Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1130--1138",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "I. J. Kelly and F. M. Boland",
  title =        "Detecting Arrivals in Room Impulse Responses With
                 Dynamic Time Warping",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1139--1147",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Guldenschuh and R. de Callafon",
  title =        "Detection of Secondary-Path Irregularities in Active
                 Noise Control Headphones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1148--1157",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sin-Horng Chen and Chiao-Hua Hsieh and Chen-Yu Chiang
                 and Hsi-Chun Hsiao and Yih-Ru Wang and Yuan-Fu Liao and
                 Hsiu-Min Yu",
  title =        "Modeling of Speaking Rate Influences on {Mandarin}
                 Speech Prosody and Its Application to Speaking
                 Rate-controlled {TTS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1158--1171",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Comminiello and M. Scarpiniti and L. A.
                 Azpicueta-Ruiz and J. Arenas-Garc{\'\i}a and A. Uncini",
  title =        "Nonlinear Acoustic Echo Cancellation Based on Sparse
                 Functional Link Representations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1172--1183",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wen Zhang and T. D. Abhayapala",
  title =        "Three Dimensional Sound Field Reproduction using
                 Multiple Circular Loudspeaker Arrays: Functional
                 Analysis Guided Approach",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1184--1194",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Taseska and E. A. P. Habets",
  title =        "Informed Spatial Filtering for Sound Extraction Using
                 Distributed Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1195--1207",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mo Shen and D. Kawahara and S. Kurohashi",
  title =        "Dependency Parse Reranking with Rich Subtree
                 Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1208--1218",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1221--1222",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1223--1224",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "1225--1225",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "B1219--B1220",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "C1",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "C2",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "C3",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "7",
  pages =        "C4",
  month =        jul,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:38 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1221--1222",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1223--1224",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhibao Li and K. F. C. Yiu and S. Nordholm",
  title =        "On the Indoor Beamformer Design With Reverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1225--1235",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. B. Hawes and Wei Liu",
  title =        "Sparse Array Design for Wideband Beamforming With
                 Reduced Complexity in Tapped Delay-Lines",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1236--1247",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi FanChiang and Cheng-Wen Wei and Yi-Le Meng and
                 Yu-Wen Lin and Shyh-Jye Jou and Tian-Sheuan Chang",
  title =        "Low Complexity Formant Estimation Adaptive Feedback
                 Cancellation for Hearing Aids Using Pitch Based
                 Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1248--1259",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  note =         "See correction \cite{FanChiang:2014:CLC}.",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Conan and O. Derrien and M. Aramaki and S. Ystad
                 and R. Kronland-Martinet",
  title =        "A Synthesis Model With Intuitive Control Capabilities
                 for Rolling Sounds",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1260--1273",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "C. Schuldt and P. H{\"a}ndel",
  title =        "Decay Rate Estimators and Their Performance for Blind
                 Reverberation Time Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1274--1284",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Ganapathy and S. H. Mallidi and H. Hermansky",
  title =        "Robust Feature Extraction Using Modulation Filtering
                 of Autoregressive Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1285--1295",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bo Li and Khe Chai Sim",
  title =        "A Spectral Masking Approach to Noise-Robust Speech
                 Recognition Using Deep Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1296--1305",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "E. Yilmaz and J. F. Gemmeke and H. {Van hamme}",
  title =        "Noise Robust Exemplar Matching Using Sparse
                 Representations of Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1306--1319",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Schmid and G. Enzner and S. Malik and D. Kolossa
                 and R. Martin",
  title =        "Variational {Bayesian} Inference for Multichannel
                 Dereverberation and Noise Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1320--1335",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1336--1337",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1338--1339",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "1340--1340",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "C1",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "C2",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "C3",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "8",
  pages =        "C4",
  month =        aug,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1341--1342",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1343--1344",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "B. Masiero and M. Vorl{\"a}nder",
  title =        "A Framework for the Calculation of Dynamic Crosstalk
                 Cancellation Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1345--1354",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Schasse and R. Martin",
  title =        "Estimation of Subband Speech Correlations for Noise
                 Reduction via {MVDR} Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1355--1365",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Michal Novotn{\'y} and Jan Rusz and Roman {\v{C}}mejla
                 and Ev{\v{z}}en R{\r{u}}{\v{z}}i{\v{c}}ka",
  title =        "Automatic Evaluation of Articulatory Disorders in
                 {Parkinson}'s Disease",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1366--1378",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "F. Lim and Wancheng Zhang and E. A. P. Habets and P.
                 A. Naylor",
  title =        "Robust Multichannel Dereverberation using Relaxed
                 Multichannel Least Squares",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1379--1390",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. H. Ghalehjegh and R. C. Rose",
  title =        "Linear Regression Based Acoustic Adaptation for the
                 Subspace {Gaussian} Mixture Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1391--1402",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Botts and L. Savioja",
  title =        "Spectral and Pseudospectral Properties of Finite
                 Difference Models Used in Audio and Room Acoustics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1403--1412",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yong Xiang and I. Natgunanathan and Song Guo and
                 Wanlei Zhou and S. Nahavandi",
  title =        "Patchwork-Based Audio Watermarking Method Robust to
                 De-synchronization Attacks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1413--1423",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "I. V. McLoughlin",
  title =        "Super-Audible Voice Activity Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1424--1433",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Alinaghi and P. J. Jackson and Qingju Liu and Wenwu
                 Wang",
  title =        "Joint Mixing Vector and Binaural Model Based Stereo
                 Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1434--1448",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1451--1452",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1453--1454",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1455--1455",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Together, we are advancing technology",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "1456--1456",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "B1449--B1450",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "C1",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "C2",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "C3",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "9",
  pages =        "C4",
  month =        sep,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:39 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1451--1452",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1453--1454",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Liheng Zhao and J. Benesty and Jingdong Chen",
  title =        "Design of Robust Differential Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1455--1466",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "P. Jain and R. B. Pachori",
  title =        "Event-Based Method for Instantaneous Fundamental
                 Frequency Estimation from Voiced Speech Based on
                 Eigenvalue Decomposition of the {Hankel} Matrix",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1467--1482",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Y. Vaizman and B. McFee and G. Lanckriet",
  title =        "Codebook-Based Audio Feature Representation for Music
                 Information Retrieval",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1483--1493",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "O. Nadiri and B. Rafaely",
  title =        "Localization of Multiple Speakers under High
                 Reverberation using a Spherical Microphone Array and
                 the Direct-Path Dominance Test",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1494--1505",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhizheng Wu and T. Virtanen and Eng Siong Chng and
                 Haizhou Li",
  title =        "Exemplar-Based Sparse Representation With Residual
                 Compensation for Voice Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1506--1521",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. S. Talagala and Wen Zhang and T. D. Abhayapala",
  title =        "Efficient Multi-Channel Adaptive Room Compensation for
                 Spatial Soundfield Reproduction Using a Modal
                 Decomposition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1522--1532",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "O. Abdel-Hamid and A.-R. Mohamed and Hui Jiang and Li
                 Deng and G. Penn and Dong Yu",
  title =        "Convolutional Neural Networks for Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1533--1545",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Koyama and K. Furuya and Y. Hiwasaki and Y. Haneda
                 and Y. Suzuki",
  title =        "Wave Field Reconstruction Filtering in Cylindrical
                 Harmonic Domain for With-Height Recording and
                 Reproduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1546--1557",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chia-Ping Chen and Yi-Chin Huang and Chung-Hsien Wu
                 and Kuan-De Lee",
  title =        "Polyglot Speech Synthesis Based on Cross-Lingual Frame
                 Selection Using Auditory and Articulatory Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1558--1570",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1571--1572",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1573--1574",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1575--1575",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Together, we are advancing technology",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "1576--1576",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "C1",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "C2",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "C3",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "10",
  pages =        "C4",
  month =        oct,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1577--1578",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1579--1580",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jian Xu and Zhi-Jie Yan and Qiang Huo",
  title =        "An Unsupervised Adaptation Approach to Leveraging
                 Feedback Loop Data by Using $i$-Vector for Data
                 Clustering and Selection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1581--1589",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Cumani and P. Laface",
  title =        "Large-Scale Training of Pairwise Support Vector
                 Machines for Speaker Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1590--1600",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jun Du and Qiang Huo",
  title =        "An Improved {VTS} Feature Compensation using Mixture
                 Models of Distortion and {IVN} Training for Noisy
                 Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1601--1611",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Togami and Y. Kawaguchi",
  title =        "Simultaneous Optimization of Acoustic Echo Reduction,
                 Speech Dereverberation, and Noise Reduction against
                 Mutual Interference",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1612--1623",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Lorente and M. Ferrer and M. de Diego and A.
                 Gonzalez",
  title =        "{GPU} Implementation of Multichannel Adaptive
                 Algorithms for Local Active Noise Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1624--1635",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Helie",
  title =        "Simulation of Fractional-Order Low-Pass Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1636--1647",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "B. Defraene and T. van Waterschoot and M. Diehl and M.
                 Moonen",
  title =        "Embedded-Optimization-Based Loudspeaker
                 Precompensation Using a {Hammerstein} Loudspeaker
                 Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1648--1659",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guangsen Wang and Khe Chai Sim",
  title =        "Regression-Based Context-Dependent Modeling of Deep
                 Neural Networks for Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1660--1669",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. Badeau and M. D. Plumbley",
  title =        "Multichannel High-Resolution {NMF} for Modeling
                 Convolutive Mixtures of Non-Stationary Signals in the
                 Time-Frequency Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1670--1680",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1683--1684",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "1685--1686",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "B1681--B1682",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "C1",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "C2",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "C3",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "11",
  pages =        "C4",
  month =        nov,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1683--1685",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Li Deng",
  title =        "Farewell editorial: Keeping up the momentum of
                 \ldots{}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1687--1687",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. H. Yella and H. Bourlard",
  title =        "Overlapping Speech Detection Using Long-Term
                 Conversational Features for Speaker Diarization in
                 Meeting Room Conversations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1688--1700",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. K. Chivukula and Y. A. Reznik and Yanyan Hu and V.
                 Devarajan and M. Jayendra-Lakshman",
  title =        "Fast Algorithms for Low-Delay {TDAC} Filterbanks in
                 {MPEG-4} {AAC--ELD}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1701--1712",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shaofei Xue and O. Abdel-Hamid and Hui Jiang and
                 Lirong Dai and Qingfeng Liu",
  title =        "Fast Adaptation of Deep Neural Network Based on
                 Discriminant Codes for Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1713--1725",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. E. P. Davies and P. Hamel and K. Yoshii and M.
                 Goto",
  title =        "{AutoMashUpper}: Automatic Creation of Multi-Song
                 Music Mashups",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1726--1737",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chao Weng and D. L. Thomson and P. Haffner and B.-H.
                 F. Juang",
  title =        "Latent Semantic Rational Kernels for Topic Spotting on
                 Conversational Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1738--1749",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "N. Wachowski and M. R. Azimi-Sadjadi",
  title =        "Detection and Classification of Nonstationary
                 Transient Signals Using Sparse Approximations and
                 {Bayesian} Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1750--1764",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "G. Percival and G. Tzanetakis",
  title =        "Streamlined Tempo Estimation Based on Autocorrelation
                 and Cross-correlation With Pulses",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1765--1776",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Barkefors and M. Sternad and L.-J. Brannmark",
  title =        "Design and Analysis of Linear Quadratic {Gaussian}
                 Feedforward Controllers for Active Noise Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1777--1791",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Cobos and J. J. Perez-Solano and S. Felici-Castell
                 and J. Segura and J. M. Navarro",
  title =        "Cumulative-Sum-Based Localization of Sound Events in
                 Low-Cost Wireless Acoustic Sensor Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1792--1802",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "V. Tourbabin and B. Rafaely",
  title =        "Theoretical Framework for the Optimization of
                 Microphone Array Configuration for Humanoid Robot
                 Audition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1803--1814",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Y. Zakharov and V. H. Nascimento",
  title =        "Sliding-Window {RLS} Low-Cost Implementation of
                 Proportionate Affine Projection Algorithms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1815--1824",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. D'Angelo and V. Valimaki",
  title =        "Generalized {Moog} Ladder Filter: {Part I} --- Linear
                 Analysis and Parameterization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1825--1832",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Na Yang and He Ba and Weiyang Cai and I. Demirkol and
                 W. Heinzelman",
  title =        "{BaNa}: a Noise Resilient Fundamental Frequency
                 Detection Algorithm for Speech and Music",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1833--1848",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuxuan Wang and A. Narayanan and Deliang Wang",
  title =        "On Training Targets for Supervised Speech Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1849--1858",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ling-Hui Chen and Zhen-Hua Ling and Li-Juan Liu and
                 Li-Rong Dai",
  title =        "Voice Conversion Using Deep Neural Networks With
                 Layer-Wise Generative Training",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1859--1872",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. D'Angelo and V. Valimaki",
  title =        "Generalized {Moog} Ladder Filter: {Part II} ---
                 Explicit Nonlinear Model through a Novel Delay-Free
                 Loop Implementation Method",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1873--1883",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Z. Rafii and Zhiyao Duan and B. Pardo",
  title =        "Combining Rhythm-Based and Pitch-Based Methods for
                 Background and Melody Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1884--1893",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Ramo and V. Valimaki and B. Bank",
  title =        "High-Precision Parallel Graphic Equalizer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1894--1904",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Y. Panagakis and C. L. Kotropoulos and G. R. Arce",
  title =        "Music Genre Classification via Joint Sparse Low-Rank
                 Representation of Audio Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1905--1917",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Maezawa and K. Itoyama and K. Yoshii and H. G.
                 Okuno",
  title =        "Nonparametric {Bayesian} Dereverberation of Power
                 Spectrograms Based on Infinite-Order Autoregressive
                 Processes",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1918--1930",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Krawczyk and T. Gerkmann",
  title =        "{STFT} Phase Reconstruction in Voiced Speech for an
                 Improved Single-Channel Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1931--1940",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "V. Khanagha and K. Daoudi and H. M. Yahia",
  title =        "Detection of Glottal Closure Instants Based on the
                 Microcanonical Multiscale Formalism",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1941--1950",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Venturini and L. Zao and R. Coelho",
  title =        "On speech features fusion, $ \alpha $-integration
                 {Gaussian} modeling and multi-style training for noise
                 robust speaker classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1951--1964",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "P. Foster and M. Mauch and S. Dixon",
  title =        "Sequential Complexity as a Descriptor for Musical
                 Similarity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1965--1977",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Gang Liu and J. H. L. Hansen",
  title =        "An Investigation into Back-end Advancements for
                 Speaker Recognition in Multi-Session and Noisy
                 Enrollment Scenarios",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1978--1992",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jitong Chen and Yuxuan Wang and Deliang Wang",
  title =        "A Feature Study for Classification-Based Speech
                 Separation at Low Signal-to-Noise Ratios",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "1993--2002",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. van Mourik and D. Murphy",
  title =        "Explicit Higher-Order {FDTD} Schemes for {$3$D} Room
                 Acoustic Simulation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2003--2011",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Pei Chee Yong and S. Nordholm and Hai Huyen Dam",
  title =        "Effective Binaural Multi-Channel Processing Algorithm
                 for Improved Environmental Presence",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2012--2024",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Chen and M. A. Hasegawa-Johnson",
  title =        "Mixed Stereo Audio Classification Using a Stereo-Input
                 Mixed-to-Panned Level Feature",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2025--2033",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Gongping Huang and J. Benesty and Tao Long and
                 Jingdong Chen",
  title =        "A Family of Maximum {SNR} Filters for Noise
                 Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2034--2047",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Su Yan and Xiaojun Wan",
  title =        "{SRRank}: Leveraging Semantic Roles for Extractive
                 Multi-Document Summarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2048--2058",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Tachibana and N. Ono and H. Kameoka and S.
                 Sagayama",
  title =        "Harmonic\slash Percussive Sound Separation Based on
                 Anisotropic Smoothness of Spectrograms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2059--2073",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. M. Gil-Cacho and T. van Waterschoot and M. Moonen
                 and S. H. Jensen",
  title =        "A Frequency-Domain Adaptive Filter {(FDAF)} Prediction
                 Error Method {(PEM)} Framework for Double-Talk-Robust
                 Acoustic Echo Cancellation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2074--2086",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qi Wang and W. L. Woo and S. S. Dlay",
  title =        "Informed Single-Channel Speech Separation Using
                 {HMM--GMM} User-Generated Exemplar Source",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2087--2100",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Erro and T.-C. Zorila and Y. Stylianou",
  title =        "Enhancing the Intelligibility of Statistically
                 Generated Synthetic Speech by Means of
                 Noise-Independent Modifications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2101--2111",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi Jiang and Deliang Wang and Runsheng Liu and
                 ZhenMing Feng",
  title =        "Binaural Classification for Reverberant Speech
                 Segregation Using Deep Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2112--2121",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Li Su and Hsin-Ming Lin and Yi-Hsuan Yang",
  title =        "Sparse Modeling of Magnitude and Phase-Derived Spectra
                 for Playing Technique Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2122--2132",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "V. V. Reddy and A. W. H. Khong and Boon Poh Ng",
  title =        "Unambiguous Speech {DOA} Estimation Under Spatial
                 Aliasing Conditions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2133--2145",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Mohammadi and S. S. Sarfjoo and C. Demiroglu",
  title =        "Eigenvoice Speaker Adaptation with Minimal Data for
                 Statistical Speech Synthesis Systems Using a {MAP}
                 Approach and Nearest-Neighbors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2146--2157",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kun Han and Deliang Wang",
  title =        "Neural Network Based Pitch Tracking in Very Noisy
                 Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2158--2168",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yongsheng Mu and Peifeng Ji and Wei Ji and Ming Wu and
                 Jun Yang",
  title =        "Modeling and Compensation for the Distortion of
                 Parametric Loudspeakers Using a One-Dimension
                 {Volterra} Filter",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2169--2181",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "O. Thiergart and M. Taseska and E. A. P. Habets",
  title =        "An Informed Parametric Spatial Filter Based on
                 Instantaneous Direction-of-Arrival Estimates",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2182--2196",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. F. Santos and T. H. Falk",
  title =        "Updating the {SRMR--CI} Metric for Improved
                 Intelligibility Prediction for Cochlear Implant Users",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2197--2206",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Seon Man Kim and Hong Kook Kim",
  title =        "Direction-of-Arrival Based {SNR} Estimation for
                 Dual-Microphone Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2207--2217",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Otsuka and K. Ishiguro and T. Yoshioka and H.
                 Sawada and H. G. Okuno",
  title =        "Multichannel Sound Source Dereverberation and
                 Separation for Arbitrary Number of Sources Based on
                 {Bayesian} Nonparametrics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2218--2232",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Traa and P. Smaragdis",
  title =        "Multichannel Source Separation and Tracking With
                 {RANSAC} and Directional Statistics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2233--2243",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Weifeng Li and Longbiao Wang and Yicong Zhou and J.
                 Dines and M. Magimai-Doss and H. Bourlard and Qingmin
                 Liao",
  title =        "Feature Mapping of Multiple Beamformed Sources for
                 Robust Overlapping Speech Recognition Using a
                 Microphone Array",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2244--2255",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Y. FanChiang and C.-W. Wei and Y.-L. Meng and Y.-W.
                 Lin and S.-J. Jou and T.-S. Chang",
  title =        "Correction to {``Low Complexity Formant Estimation
                 Adaptive Feedback Cancellation for Hearing Aids Using
                 Pitch Based Processing'' [Aug {\bf 14} 1248--1259]}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2256--2256",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  note =         "See \cite{FanChiang:2014:LCF}.",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "List of Reviewers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2257--2259",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2260--2261",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2262--2263",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "2014 Index {IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing} Vol. 22",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2264--2288",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "[{Blank} page]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "B1686",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "C1",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "C2",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "C3",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "C4",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "1--2",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "3--4",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "H. Li",
  title =        "Inaugural Editorial: Embracing New Opportunities for
                 Growth",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "5--6",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Yong Xu and Jun Du and Li-Rong Dai and Chin-Hui Lee",
  title =        "A Regression Approach to Speech Enhancement Based on
                 Deep Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "7--19",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "H. Phan and M. Maas and R. Mazur and A. Mertins",
  title =        "Random Regression Forests for Acoustic Event Detection
                 and Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "20--31",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Yuntao Wu and L. Amir and J. R. Jensen and Guisheng
                 Liao",
  title =        "Joint Pitch and {DOA} Estimation Using the {ESPRIT}
                 Method",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "32--45",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "R. Decorsiere and P. L. S{\o}ndergaard and E. N.
                 MacDonald and T. Dau",
  title =        "Inversion of Auditory Spectrograms, Traditional
                 Spectrograms, and Other Envelope Representations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "46--56",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "J. Poignant and L. Besacier and G. Qu{\'e}not",
  title =        "Unsupervised Speaker Identification in {TV} Broadcast
                 Based on Written Names",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "57--68",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Renjie Tong and Yingyue Zhou and Long Zhang and
                 Guangzhao Bao and Zhongfu Ye",
  title =        "A Robust Time-Frequency Decomposition Model for
                 Suppression of Mixed {Gaussian}-Impulse Noise in Audio
                 Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "69--79",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "S. Ahani and S. Ghaemmaghami and Z. J. Wang",
  title =        "A Sparse Representation-Based Wavelet Domain Speech
                 Steganography Method",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "80--91",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "A. Narayanan and Deliang Wang",
  title =        "Improving Robustness of Deep Neural Network Acoustic
                 Models via Speech Separation and Joint Adaptive
                 Training",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "92--101",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Rongfeng Su and Xunying Liu and Lan Wang",
  title =        "Automatic Complexity Control of Generalized Variable
                 Parameter {HMMs} for Noise Robust Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "102--114",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Zixing Zhang and E. Coutinho and Jun Deng and B.
                 Schuller",
  title =        "Cooperative Learning and its Application to Emotion
                 Recognition from Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "115--126",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Pei-hao Su and Chuan-hsun Wu and Lin-shan Lee",
  title =        "A Recursive Dialogue Game for Personalized
                 Computer-Aided Pronunciation Training",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "127--141",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "A. Rakotomamonjy and G. Gasso",
  title =        "Histogram of Gradients of Time--Frequency
                 Representations for Audio Scene Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "142--153",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "S. A. Khoubrouy and I. M. S. Panahi and J. H. L.
                 Hansen",
  title =        "Howling Detection in Hearing Aids Based on Generalized
                 {Teager--Kaiser} Operator",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "154--161",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "J. B. B. Nielsen and J. Nielsen and J. Larsen",
  title =        "Perception-Based Personalization of Hearing Aids Using
                 {Gaussian} Processes and Active Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "162--173",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "J. R. Jensen and M. G. Christensen and J. Benesty and
                 S. H. Jensen",
  title =        "Joint Spatio-Temporal Filtering Methods for {DOA} and
                 Fundamental Frequency Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "174--185",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "J. Jensen and Zheng-Hua Tan",
  title =        "Minimum Mean-Square Error Estimation of Mel-Frequency
                 Cepstral Features --- A Theoretically Consistent
                 Approach",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "186--197",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "C.-D. Martinez-Hinarejos and J.-M. Benedi and V.
                 Tamarit",
  title =        "Unsegmented Dialogue Act Annotation and Decoding With
                 {$N$}-Gram Transducers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "198--211",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Lin Wang and Zhe Chen and Fuliang Yin",
  title =        "A Novel Hierarchical Decomposition Vector Quantization
                 Method for High-Order {LPC} Parameters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "212--221",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "[{Blank} page]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "222--222",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "223--224",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "225--226",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "227--227",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "C1",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "C2",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "C3",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "C4",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "223--224",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "225--226",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Guang Hua and J. Goh and V. L. L. Thing",
  title =        "Time-Spread Echo-Based Audio Watermarking With
                 Optimized Imperceptibility and Robustness",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "227--239",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "O. Schwartz and S. Gannot and E. A. P. Habets",
  title =        "Multi-Microphone Speech Dereverberation and Noise
                 Reduction Using Relative Early Transfer Functions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "240--251",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "E. Molina and L. J. Tardon and A. M. Barbancho and I.
                 Barbancho",
  title =        "{SiPTH}: Singing Transcription Based on Hysteresis
                 Defined on the Pitch-Time Curve",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "252--263",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Haipeng Wang and Tan Lee and Cheung-Chi Leung and Bin
                 Ma and Haizhou Li",
  title =        "Acoustic Segment Modeling with Spectral Clustering
                 Methods",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "264--277",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "V. Arora and L. Behera",
  title =        "Multiple {F0} Estimation and Source Clustering of
                 Polyphonic Music Audio Using {PLCA} and {HMRFs}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "278--287",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "R. Sugiura and Y. Kamamoto and N. Harada and H.
                 Kameoka and T. Moriya",
  title =        "Resolution Warped Spectral Representation for
                 Low-Delay and Low-Bit-Rate Audio {Coder}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "288--299",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Chao Weng and B.-H. F. Juang",
  title =        "Discriminative Training Using Non-Uniform Criteria for
                 Keyword Spotting on Spontaneous Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "300--312",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Y. Matsuyama and A. Saito and S. Fujie and T.
                 Kobayashi",
  title =        "Automatic Expressive Opinion Sentence Generation for
                 Enjoyable Conversational Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "313--326",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "P. N. Petkov and W. B. Kleijn",
  title =        "Spectral Dynamics Recovery for Enhanced Speech
                 Intelligibility in Noise",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "327--338",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "E. Bicici and D. Yuret",
  title =        "Optimizing Instance Selection for Statistical Machine
                 Translation with Feature Decay Algorithms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "339--350",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Mengqiu Zhang and R. A. Kennedy and T. D. Abhayapala",
  title =        "Empirical Determination of Frequency Representation in
                 Spherical Harmonics-Based {HRTF} Functional Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "351--360",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zu-Ren Feng and Qing Zhou and Jun Zhang and Ping Jiang
                 and Xue-Wen Yang",
  title =        "A Target Guided Subband Filter for Acoustic Event
                 Detection in Noisy Environments Using Wavelet Packets",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "361--372",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "N. Hirayama and K. Yoshino and K. Itoyama and S. Mori
                 and H. G. Okuno",
  title =        "Automatic Speech Recognition for Mixed Dialect
                 Utterances by Mixing Dialect Language Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "373--382",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Schasse and T. Gerkmann and R. Martin and W. Sorgel
                 and T. Pilgrim and H. Puder",
  title =        "Two-Stage Filter-Bank System for Improved
                 Single-Channel Noise Reduction in Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "383--393",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "B. Schwartz and S. Gannot and E. A. P. Habets",
  title =        "Online Speech Dereverberation Using {Kalman} Filter
                 and {EM} Algorithm",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "394--406",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "B. Gerazov and Z. Ivanovski",
  title =        "Kernel Power Flow Orientation Coefficients for
                 Noise-Robust Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "407--419",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "420--421",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "422--423",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "424--424",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "C1",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "C2",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "C3",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "2",
  pages =        "C4",
  month =        feb,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "425--426",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Li and M. Federico and X. He and H. Meng and I.
                 Trancoso",
  title =        "Introduction to the Special Section on Continuous
                 Space and Related Methods in Natural Language
                 Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "427--430",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Adel and Ngoc Thang Vu and K. Kirchhoff and D.
                 Telaar and T. Schultz",
  title =        "Syntactic and Semantic Features For Code-Switching
                 Factored Language Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "431--440",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaodong Zeng and D. F. Wong and L. S. Chao and I.
                 Trancoso",
  title =        "Graph-Based Lexicon Regularization for {PCFG} With
                 Latent Annotations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "441--450",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wenliang Chen and Min Zhang and Yue Zhang",
  title =        "Distributed Feature Representations for Dependency
                 Parsing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "451--460",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ruiji Fu and Jiang Guo and Bing Qin and Wanxiang Che
                 and Haifeng Wang and Ting Liu",
  title =        "Learning Semantic Hierarchies: a Continuous Vector
                 Space Approach",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "461--471",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. E. Banchs and L. F. D'Haro and Haizhou Li",
  title =        "Adequacy--Fluency Metrics: Evaluating {MT} in the
                 Continuous Space Model Framework",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "472--482",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Deyi Xiong and Min Zhang and Xing Wang",
  title =        "Topic-Based Coherence Modeling for Statistical Machine
                 Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "483--493",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "B. Hutchinson and M. Ostendorf and M. Fazel",
  title =        "A Sparse Plus Low-Rank Exponential Language Model for
                 Limited Resource Scenarios",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "494--504",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. A. A. Rashwan and A. A. {Al Sallab} and H. M.
                 Raafat and A. Rafea",
  title =        "Deep Learning Framework with Confused Sub-Set
                 Resolution Architecture for Automatic {Arabic}
                 Diacritization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "505--516",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Sundermeyer and H. Ney and R. Schluter",
  title =        "From Feedforward to Recurrent {LSTM} Neural Networks
                 for Language Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "517--529",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "G. Mesnil and Y. Dauphin and Kaisheng Yao and Y.
                 Bengio and Li Deng and D. Hakkani-Tur and Xiaodong He
                 and L. Heck and G. Tur and Dong Yu and G. Zweig",
  title =        "Using Recurrent Neural Networks for Slot Filling in
                 Spoken Language Understanding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "530--539",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "I. McLoughlin and Haomin Zhang and Zhipeng Xie and Yan
                 Song and Wei Xiao",
  title =        "Robust Sound Event Classification Using Deep Neural
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "540--552",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Zahoransky and I. Polasek",
  title =        "Text Search of Surnames in Some {Slavic} and Other
                 Morphologically Rich Languages Using Rule Based
                 Phonetic Algorithms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "553--563",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yow-Bang Wang and Lin-shan Lee",
  title =        "Supervised Detection and Unsupervised Discovery of
                 Pronunciation Error Patterns for Computer-Assisted
                 Language Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "564--579",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Nakashika and T. Takiguchi and Y. Ariki",
  title =        "Voice Conversion Using {RNN} Pre-Trained by Recurrent
                 Temporal Restricted {Boltzmann} Machines",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "580--587",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "N. Obin and P. Lanchantin",
  title =        "Symbolic Modeling of Prosody: From Linguistics to
                 Statistics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "588--599",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "601--602",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "603--604",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE} Member Digital Library",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "606--606",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "B600",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "C1",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "C2",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "C3",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "C4",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "601--602",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "603--604",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Langzhou Chen and N. Braunschweiler and M. J. F.
                 Gales",
  title =        "Speaker and Expression Factorization for Audiobook
                 Data: Expressiveness and Transplantation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "605--618",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xinjie Zhou and Xiaojun Wan and Jianguo Xiao",
  title =        "{CLOpinionMiner}: Opinion Target Extraction in a
                 Cross-Language Scenario",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "619--630",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Pan Zhou and Hui Jiang and Li-Rong Dai and Yu Hu and
                 Qing-Feng Liu",
  title =        "State-Clustering Based Multiple Deep Neural Networks
                 Modeling Approach for Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "631--642",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ying Hu and Guizhong Liu",
  title =        "Separation of Singing Voice Using Nonnegative Matrix
                 Partial Co-Factorization for Singer Identification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "643--653",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Kitamura and H. Saruwatari and H. Kameoka and Yu.
                 Takahashi and K. Kondo and S. Nakamura",
  title =        "Multichannel Signal Separation Combining Directional
                 Clustering and Nonnegative Matrix Factorization with
                 Spectrogram Restoration",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "654--669",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Van-Khanh Mai and D. Pastor and A. Aissa-El-Bey and R.
                 Le-Bidan",
  title =        "Robust Estimation of Non-Stationary Noise Power
                 Spectrum for Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "670--682",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "E. Blanco and D. Moldovan",
  title =        "A Semantic Logic-Based Approach to Determine Textual
                 Similarity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "683--693",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Myung Jong Kim and Younggwan Kim and Hoirin Kim",
  title =        "Automatic Intelligibility Assessment of Dysarthric
                 Speech Using Phonologically-Structured Sparse Linear
                 Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "694--704",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "G. Aneeja and B. Yegnanarayana",
  title =        "Single Frequency Filtering Approach for Discriminating
                 Speech and Nonspeech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "705--717",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Deleforge and R. Horaud and Y. Y. Schechner and L.
                 Girin",
  title =        "Co-Localization of Audio Sources in Images Using
                 Binaural Features and Locally-Linear Regression",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "718--731",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Dov and R. Talmon and I. Cohen",
  title =        "Audio-Visual Voice Activity Detection Using Diffusion
                 Maps",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "732--745",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Habibi and A. Popescu-Belis",
  title =        "Keyword Extraction and Clustering for Document
                 Recommendation in Conversations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "746--759",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "N. Mamun and W. A. Jassim and M. S. A. Zilany",
  title =        "Prediction of Speech Intelligibility Using a Neurogram
                 Orthogonal Polynomial Measure {(NOPM)}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "760--773",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "E. {De Sena} and N. Antonello and M. Moonen and T. van
                 Waterschoot",
  title =        "On the Modeling of Rectangular Geometries in Room
                 Acoustic Simulations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "774--786",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hao Huang and Haihua Xu and Xianhui Wang and W.
                 Silamu",
  title =        "Maximum {F1}-Score Discriminative Training Criterion
                 for Automatic Mispronunciation Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "787--797",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chung-Che Wang and J.-S. R. Jang",
  title =        "Improving Query-by-Singing\slash Humming by Combining
                 Melody and Lyric Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "798--806",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "807--808",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "809--810",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE} Member Digital Library",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "812--812",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "C1",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "C2",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "C3",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "C4",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "813--814",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "815--816",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "F. Krebs and A. Holzapfel and A. T. Cemgil and G.
                 Widmer",
  title =        "Inferring Metrical Structure in Music Using Particle
                 Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "817--827",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Janghoon Cho and C. D. Yoo",
  title =        "Underdetermined Convolutive {BSS}: {Bayes} Risk
                 Minimization Based on a Mixture of Super-{Gaussian}
                 Posterior Approximation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "828--839",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hao Mu and Woon-Seng Gan and Ee-Leng Tan",
  title =        "An Objective Analysis Method for Perceptual Quality of
                 a Virtual {Bass} System",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "840--850",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. C. Hendriks and J. B. Crespo and J. Jensen and C.
                 H. Taal",
  title =        "Optimal Near-End Speech Intelligibility Improvement
                 Incorporating Additive Noise and Late Reverberation
                 Under an Approximation of the Short-Time {SII}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "851--862",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. H. Abdelaziz and S. Zeiler and D. Kolossa",
  title =        "Learning Dynamic Stream Weights For
                 Coupled-{HMM}-Based Audio-Visual Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "863--876",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. Berkun and I. Cohen and J. Benesty",
  title =        "Combined Beamformers for Robust Broadband Regularized
                 Superdirective Beamforming",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "877--886",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Breebaart",
  title =        "Evaluation of Statistical Inference Tests Applied to
                 Subjective Audio Quality Data With Small Sample Size",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "887--897",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Zivanovi{\'c}",
  title =        "Harmonic Bandwidth Companding for Separation of
                 Overlapping Harmonics in Pitched Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "898--908",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jen-Tzung Chien",
  title =        "{Laplace} Group Sensing for Acoustic Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "909--922",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ying Wei and Yinfeng Wang",
  title =        "Design of Low Complexity Adjustable Filter Bank for
                 Personalized Hearing Aid Solutions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "923--931",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Perez-Carrillo and M. M. Wanderley",
  title =        "Indirect Acquisition of Violin Instrumental Controls
                 from Audio Signal with Hidden {Markov} Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "932--940",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Mansikkaniemi and M. Kurimo",
  title =        "Adaptation of Morph-Based Speech Recognition for
                 Foreign Names and Acronyms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "941--950",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "953--954",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "955--956",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "957--957",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "B951--B952",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "C1",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "C2",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "C3",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "C4",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "953--954",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "955--956",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shih-Hung Liu and Kuan-Yu Chen and B. Chen and
                 Hsin-Min Wang and Hsu-Chun Yen and Wen-Lian Hsu",
  title =        "Combining Relevance Language Modeling and Clarity
                 Measure for Extractive Speech Summarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "957--969",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Niedzwiecki and M. Ciolek and K. Cisowski",
  title =        "Elimination of Impulsive Disturbances From Stereo
                 Audio Recordings Using Vector Autoregressive Modeling
                 and Variable-order {Kalman} Filtering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "970--981",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kun Han and Yuxuan Wang and Deliang Wang and W. S.
                 Woods and I. Merks and Tao Zhang",
  title =        "Learning Spectral Mapping for Speech Dereverberation
                 and Denoising",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "982--992",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "P. Foster and S. Dixon and A. Klapuri",
  title =        "Identifying Cover Songs Using Information-Theoretic
                 Measures of Similarity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "993--1005",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Schwarz and W. Kellermann",
  title =        "Coherent-to-Diffuse Power Ratio Estimation for
                 Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "1006--1018",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Cernak and P. N. Garner and A. Lazaridis and P.
                 Motlicek and Xingyu Na",
  title =        "Incremental Syllable-Context Phonetic Vocoding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "1019--1030",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Rouvier and S. Oger and G. Linares and D. Matrouf
                 and B. Merialdo and Y. Li",
  title =        "Audio-Based Video Genre Identification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "1031--1041",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Kameoka and K. Yoshizato and T. Ishihara and K.
                 Kadowaki and Y. Ohishi and K. Kashino",
  title =        "Generative Modeling of Voice Fundamental Frequency
                 Contours",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "1042--1053",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dejan Markovi{\'c} and Fabio Antonacci and Augusto
                 Sarti and Stefano Tubaro",
  title =        "Multiview Soundfield Imaging in the Projective Ray
                 Space",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "1054--1067",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. P. Bates and Z. Khalid and R. A. Kennedy",
  title =        "Novel Sampling Scheme on the Sphere for Head-Related
                 Transfer Function Measurements",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "1068--1081",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Maoshen Jia and Ziyu Yang and Changchun Bao and
                 Xiguang Zheng and C. Ritz",
  title =        "Encoding Multiple Audio Objects Using Intra-Object
                 Sparsity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "1082--1095",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "1096--1097",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "1098--1099",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "1100--1100",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "C1",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "C2",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "C3",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "C4",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1101--1102",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1103--1104",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. McVicar and S. Fukayama and M. Goto",
  title =        "{AutoGuitarTab}: Computer-Aided Composition of Rhythm
                 and Lead Guitar Parts in the Tablature Space",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1105--1117",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. {Van Segbroeck} and R. Travadi and S. S.
                 Narayanan",
  title =        "Rapid Language Identification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1118--1129",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Marelli and R. Baumgartner and P. Majdak",
  title =        "Efficient Approximation of Head-Related Transfer
                 Functions in Subbands for Accurate Sound Localization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1130--1143",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ching-Feng Yeh and Lin-shan Lee",
  title =        "An Improved Framework for Recognizing Highly
                 Imbalanced Bilingual Code-Switched Lectures with
                 Cross-Language Acoustic Modeling and Frame-Level
                 Language Identification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1144--1159",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Basaran and A. T. Cemgil and E. Anarim",
  title =        "A Probabilistic Model-Based Approach for Aligning
                 Multiple Audio Sequences",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1160--1171",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dongpeng Chen and B. K.-W. Mak",
  title =        "Multitask Learning of Deep Neural Networks for
                 Low-Resource Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1172--1183",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Meyer and N. Hajlaoui and A. Popescu-Belis",
  title =        "Disambiguating Discourse Connectives for Statistical
                 Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1184--1197",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "U. Remes and A. Ramirez Lopez and K. Palomaki and M.
                 Kurimo",
  title =        "Bounded Conditional Mean Imputation with Observation
                 Uncertainties and Acoustic Model Adaptation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1198--1208",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rui Wang and Hai Zhao and Bao-Liang Lu and M. Utiyama
                 and E. Sumita",
  title =        "Bilingual Continuous-Space Language Model Growing for
                 Statistical Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1209--1220",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tze Yuang Chong and R. E. Banchs and Eng Siong Chng
                 and Haizhou Li",
  title =        "Decoupling Word-Pair Distance and Co-occurrence
                 Information for Effective Long History Context Language
                 Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1221--1232",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Meng Sun and Yinan Li and J. F. Gemmeke and Xiongwei
                 Zhang",
  title =        "Speech Enhancement Under Low {SNR} Conditions Via
                 Noise Estimation Using Sparse and Low-Rank {NMF} with
                 {Kullback--Leibler} Divergence",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1233--1242",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1245--1246",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "1247--1248",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "B1243--B1244",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "C1",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "C2",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "C3",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "7",
  pages =        "C4",
  month =        jul,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1245--1246",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1247--1248",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Momeni and H. R. Abutalebi and A. Tadaion",
  title =        "Joint Detection and Estimation of Speech Spectral
                 Amplitude Using Noncontinuous Gain Functions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1249--1258",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jen-Tzung Chien",
  title =        "Hierarchical {Pitman--Yor--Dirichlet} Language Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1259--1272",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Fallahpour and D. Meg{\'\i}as",
  title =        "Audio Watermarking Based on {Fibonacci} Numbers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1273--1282",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "P. Mowlaee and J. Kulmer",
  title =        "Phase Estimation in Single-Channel Speech Enhancement:
                 Limits-Potential",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1283--1294",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Morchid and M. Bouall{\`e}gue and R. Dufour and G.
                 Linar{\`e}s and D. Matrouf and R. {De Mori}",
  title =        "Compact Multiview Representation of Documents Based on
                 the Total Variability Space",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1295--1308",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. Sugiura and Y. Kamamoto and N. Harada and H.
                 Kameoka and T. Moriya",
  title =        "Optimal Coding of Generalized-{Gaussian}-Distributed
                 Frequency Spectra for Low-Delay Audio {Coder} With
                 Powered All-Pole Spectrum Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1309--1321",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kuan-Yu Chen and Shih-Hung Liu and B. Chen and
                 Hsin-Min Wang and Ea-Ee Jan and Wen-Lian Hsu and
                 Hsin-Hsi Chen",
  title =        "Extractive Broadcast News Summarization Leveraging
                 Recurrent Neural Network Language Modeling Techniques",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1322--1334",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Z. Koldovsk{\'y} and J. M{\'a}lek and S. Gannot",
  title =        "Spatial Source Subtraction Based on Incomplete
                 Measurements of Relative Transfer Function",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1335--1347",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Dimitriadis and E. Bocchieri",
  title =        "Use of Micro-Modulation Features in Large Vocabulary
                 Continuous Speech Recognition Tasks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1348--1357",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xun Wang and Y. Yoshida and T. Hirao and M. Nagata and
                 K. Sudoh",
  title =        "Summarization Based on Task-Oriented Discourse
                 Parsing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1358--1367",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "C. Spa and A. Rey and E. Hernandez",
  title =        "A {GPU} Implementation of an Explicit Compact {FDTD}
                 Algorithm with a Digital Impedance Filter for Room
                 Acoustics Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1368--1380",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1381--1382",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "1383--1384",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "C1",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "C2",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "C3",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "8",
  pages =        "C4",
  month =        aug,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1385--1386",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1387--1388",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lin-shan Lee and J. Glass and Hung-yi Lee and Chun-an
                 Chan",
  title =        "Spoken Content Retrieval --- Beyond Cascading Speech
                 Recognition with Text Retrieval",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1389--1420",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yishan Jiao and V. Berisha and Ming Tu and J. Liss",
  title =        "Convex Weighting Criteria for Speaking Rate
                 Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1421--1430",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jianjun He and Woon-Seng Gan and Ee-Leng Tan",
  title =        "Primary-Ambient Extraction Using Ambient Spectrum
                 Estimation for Immersive Spatial Audio Reproduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1431--1444",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  note =         "See comments \cite{Lu:2024:CXP}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qing Shen and Wei Liu and Wei Cui and Siliang Wu and
                 Y. D. Zhang and M. G. Amin",
  title =        "Low-Complexity Direction-of-Arrival Estimation Based
                 on Wideband Co-Prime Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1445--1456",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yu-Ren Chien and Hsin-Min Wang and Shyh-Kang Jeng",
  title =        "An Acoustic-Phonetic Model of {F0} Likelihood for
                 Vocal Melody Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1457--1468",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaodong Cui and V. Goel and B. Kingsbury",
  title =        "Data Augmentation for Deep Neural Network Acoustic
                 Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1469--1477",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "E. {De Sena} and H. Hac{\i}habibo{\u{g}}lu and Z.
                 Cvetkovi{\'c} and J. O. Smith",
  title =        "Efficient Synthesis of Room Acoustics via Scattering
                 Delay Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1478--1492",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lin Wang and T. Gerkmann and S. Doclo",
  title =        "Noise Power Spectral Density Estimation Using {MaxNSR}
                 Blocking Matrix",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1493--1508",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Jukic and T. van Waterschoot and T. Gerkmann and S.
                 Doclo",
  title =        "Multi-Channel Linear Prediction-Based Speech
                 Dereverberation With Sparse Priors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1509--1520",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "P. Mowlaee and J. Kulmer",
  title =        "Harmonic Phase Estimation in Single-Channel Speech
                 Enhancement Using Phase Decomposition and {SNR}
                 Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1521--1532",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1535--1536",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1537--1538",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "How can you get your idea to market first?",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "1539--1539",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "B1533--B1534",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "C1",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "C2",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "C3",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "9",
  pages =        "C4",
  month =        sep,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:45 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1535--1536",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1537--1538",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Tervo and A. Politis",
  title =        "Direction of Arrival Estimation of Reflections from
                 Room Impulse Responses Using a Spherical Microphone
                 Array",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1539--1551",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jia-Ching Wang and Yu-Hao Chin and Bo-Wei Chen and
                 Chang-Hong Lin and Chung-Hsien Wu",
  title =        "Speech Emotion Verification Using Emotion Variance
                 Modeling and Discriminant Scale-Frequency Maps",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1552--1562",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Canclini and P. Bestagini and F. Antonacci and M.
                 Compagnoni and A. Sarti and S. Tubaro",
  title =        "A Robust and Low-Complexity Source Localization
                 Algorithm for Asynchronous Distributed Microphone
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1563--1575",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jianjun He and Woon-Seng Gan and Ee-Leng Tan",
  title =        "Time-Shifting Based Primary-Ambient Extraction for
                 Spatial Audio Reproduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1576--1588",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "P. Shah and I. Lewis and S. Grant and S. Angrignon",
  title =        "Nonlinear Acoustic Echo Cancellation Using Voltage and
                 Current Feedback",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1589--1599",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Li Su and Yi-Hsuan Yang",
  title =        "Combining Spectral and Temporal Representations for
                 Multipitch Estimation of Polyphonic Music",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1600--1612",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Fujioka and Y. Nagata and M. Abe",
  title =        "High-Precision Harmonic Distortion Level Measurement
                 of a Loudspeaker Using Adaptive Filters in a Noisy
                 Environment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1613--1622",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tsz-Kin Hon and Lin Wang and J. D. Reiss and A.
                 Cavallaro",
  title =        "Audio Fingerprinting for Multi-Device
                 Self-Localization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1623--1636",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ye Tian and Zhe Chen and Fuliang Yin",
  title =        "Distributed {IMM}-Unscented {Kalman} Filter for
                 Speaker Tracking in Microphone Array Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1637--1647",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Na Li and Man-Wai Mak",
  title =        "{SNR}-Invariant {PLDA} Modeling in Nonparametric
                 Subspace for Robust Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1648--1659",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Vilkamo and S. Delikaris-Manias",
  title =        "Perceptual Reproduction of Spatial Sound Using
                 Loudspeaker-Signal-Domain Parametrization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1660--1669",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chao Weng and Dong Yu and M. L. Seltzer and J.
                 Droppo",
  title =        "Deep Neural Networks for Single-Channel Multi-Talker
                 Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1670--1679",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Ruhland and J. Bitzer and M. Brandt and S. Goetze",
  title =        "Reduction of {Gaussian}, Supergaussian, and Impulsive
                 Noise by Interpolation of the Binary Mask Residual",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1680--1691",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Y. Dorfan and S. Gannot",
  title =        "Tree-Based Recursive Expectation-Maximization
                 Algorithm for Localization of Acoustic Sources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1692--1703",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1704--1705",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1706--1707",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "How can you get your idea to market first?",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "1708--1708",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "C1",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "C2",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "C3",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "10",
  pages =        "C4",
  month =        oct,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Sarmiento and I. Duran-Diaz and A. Cichocki and S.
                 Cruces",
  title =        "A Contrast Function Based on Generalized Divergences
                 for Solving the Permutation Problem in Convolved Speech
                 Mixtures",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1713--1726",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaojia Zhao and Yuxuan Wang and Deliang Wang",
  title =        "Cochannel Speaker Identification in Anechoic and
                 Reverberant Conditions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1727--1736",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Liang-Yu Chen and J.-S. R. Jang",
  title =        "Automatic Pronunciation Scoring with Score Combination
                 by Learning to Rank and Class-Normalized {DP}-Based
                 Quantization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1737--1749",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Duyu Tang and Bing Qin and Furu Wei and Li Dong and
                 Ting Liu and Ming Zhou",
  title =        "A Joint Segmentation and Classification Framework for
                 Sentence Level Sentiment Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1750--1761",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "F.-M. Hoffmann and F. M. Fazi",
  title =        "Theoretical Study of Acoustic Circular Arrays With
                 Tangential Pressure Gradient Sensors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1762--1774",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "N. Souviraa-Labastie and A. Olivero and E. Vincent and
                 F. Bimbot",
  title =        "Multi-Channel Audio Source Separation Using Multiple
                 Deformed References",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1775--1787",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Baby and T. Virtanen and J. F. Gemmeke and H. {Van
                 hamme}",
  title =        "Coupled Dictionaries for Exemplar-Based Speech
                 Enhancement and Automatic Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1788--1799",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. T. Islam and C. Shahnaz and Wei-Ping Zhu and M. O.
                 Ahmad",
  title =        "Speech Enhancement Based on Student {$t$} Modeling of Teager
                 Energy Operated Perceptual Wavelet Packet Coefficients
                 and a Custom Thresholding Function",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1800--1811",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Quynh Thi Ngoc Do and S. Bethard and M.-F. Moens",
  title =        "Domain Adaptation in Semantic Role Labeling Using a
                 Neural Language Model and Linguistic Resources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1812--1823",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Aragonda and C. S. Seelamantula",
  title =        "Demodulation of Narrowband Speech Spectrograms Using
                 the {Riesz} Transform",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1824--1834",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. T. Tran and E. Vincent and D. Jouvet",
  title =        "Nonparametric Uncertainty Estimation and Propagation
                 for Noise Robust {ASR}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1835--1846",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mei Tu and Yu Zhou and Chengqing Zong",
  title =        "Exploring Diverse Features for Statistical Machine
                 Translation Model Pruning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1847--1857",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "G. Okopal and S. Wisdom and L. Atlas",
  title =        "Speech Analysis With the Strong Uncorrelating
                 Transform",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1858--1868",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. F. Simon Galvez and S. J. Elliott and J. Cheer",
  title =        "Time Domain Optimization of Filters Used in a
                 Loudspeaker Array for Personal Audio",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1869--1878",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. H. Bokaei and H. Sameti and Yang Liu",
  title =        "Linear Discourse Segmentation of Multi-Party Meetings
                 Based on Local and Global Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1879--1891",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chung-Hsien Wu and Han-Ping Shen and Chun-Shan Hsu",
  title =        "Code-Switching Event Detection by Using a Latent
                 Language Space Model and the Delta-{Bayesian}
                 Information Criterion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1892--1903",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhangli Chen and V. Hohmann",
  title =        "Online Monaural Speech Enhancement Based on
                 Periodicity Analysis and A Priori {SNR} Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1904--1916",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Sarreshtedari and M. A. Akhaee and A. Abbasfar",
  title =        "A Watermarking Method for Digital Speech
                 Self-Recovery",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1917--1925",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "N. Moritz and J. Anemuller and B. Kollmeier",
  title =        "An Auditory Inspired Amplitude Modulation Filter Bank
                 for Robust Feature Extraction in Automatic Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1926--1937",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yajie Miao and Hao Zhang and F. Metze",
  title =        "Speaker Adaptive Training of Deep Neural Network
                 Acoustic Models Using {$I$}-Vectors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1938--1949",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "V. Morfi and G. Degottex and A. Mouchtaris",
  title =        "Speech Analysis and Synthesis with a Computationally
                 Efficient Adaptive Harmonic Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1950--1962",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Dennis and H. D. Tran and Haizhou Li",
  title =        "Generalized {Hough} Transform for Speech Pattern
                 Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1963--1972",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Feng Deng and Changchun Bao and W. B. Kleijn",
  title =        "Sparse Hidden {Markov} Models for Speech Enhancement
                 in Non-Stationary Noise Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1973--1987",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. Ranjan and Woon-Seng Gan",
  title =        "Natural Listening over Headphones in Augmented Reality
                 Using Adaptive Filtering Techniques",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "1988--2002",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "L.-H. Chen and T. Raitio and C. Valentini-Botinhao and
                 Z.-H. Ling and J. Yamagishi",
  title =        "A Deep Generative Architecture for Postfiltering in
                 Statistical Parametric Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "2003--2014",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ho Seon Shin and T. Fingscheidt and Hong-Goo Kang",
  title =        "A Priori {SNR} Estimation Using Air- and
                 Bone-Conduction Microphones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "2015--2025",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ji Wu and Miao Li and Chin-Hui Lee",
  title =        "A Probabilistic Framework for Representing Dialog
                 Systems and Entropy-Based Dialog Management Through
                 Dynamic Stochastic State Evolution",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "2026--2035",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Cumani",
  title =        "Fast Scoring of Full Posterior {PLDA} Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "2036--2045",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "V. Tourbabin and B. Rafaely",
  title =        "Direction of Arrival Estimation Using Microphone Array
                 Processing for Moving Humanoid Robots",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "2046--2058",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Y. J. Chu and S. C. Chan",
  title =        "A New Local Polynomial Modeling-Based Variable
                 Forgetting Factor {RLS} Algorithm and Its Acoustic
                 Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "2059--2069",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "F. de-la-Calle-Silos and F. J. Valverde-Albacete and
                 A. Gallardo-Antolin and C. Pelaez-Moreno",
  title =        "Morphologically Filtered Power-Normalized Cochleograms
                 as Robust, Biologically Inspired Features for {ASR}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "2070--2080",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Hirao and M. Nishino and Y. Yoshida and J. Suzuki
                 and N. Yasuda and M. Nagata",
  title =        "Summarizing a Document by Trimming the Discourse
                 Tree",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "2081--2092",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chao Pan and Jingdong Chen and J. Benesty",
  title =        "Theoretical Analysis of Differential Microphone Array
                 Beamforming and an Improved Solution",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "11",
  pages =        "2093--2105",
  month =        nov,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:46 MDT 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wanxiang Che and Yanyan Zhao and Honglei Guo and Zhong
                 Su and Ting Liu",
  title =        "Sentence Compression for Aspect-Based Sentiment
                 Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2111--2124",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Sheaffer and M. van Walstijn and B. Rafaely and K.
                 Kowalczyk",
  title =        "Binaural Reproduction of Finite Difference Simulations
                 Using Spherical Array Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2125--2135",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Po-Sen Huang and Minje Kim and M. Hasegawa-Johnson and
                 P. Smaragdis",
  title =        "Joint Optimization of Masks and Deep Recurrent Neural
                 Networks for Monaural Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2136--2147",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Heidel and Hsiang-Hung Lu and Lin-Shan Lee",
  title =        "Finding Complex Features for Guest Language Fragment
                 Recovery in Resource-Limited Code-Mixed Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2148--2161",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Marquardt and V. Hohmann and S. Doclo",
  title =        "Interaural Coherence Preservation in Multi-Channel
                 {Wiener} Filtering-Based Noise Reduction for Binaural
                 Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2162--2176",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kai Yu and Kai Sun and Lu Chen and Su Zhu",
  title =        "Constrained {Markov} {Bayesian} Polynomial for
                 Efficient Dialogue State Tracking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2177--2188",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "C. A. Anderson and P. D. Teal and M. A. Poletti",
  title =        "Spatially Robust Far-field Beamforming Using the {von
                 Mises(--Fisher)} Distribution",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2189--2197",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. Schroder and S. Goetze and J. Anemuller",
  title =        "Spectro-Temporal {Gabor} Filterbank Features for
                 Acoustic Event Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2198--2208",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Inseok Heo and W. A. Sethares",
  title =        "Classification Based on Speech Rhythm via a Temporal
                 Alignment of Spoken Sentences",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2209--2216",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "P. Samarasinghe and T. Abhayapala and M. Poletti and
                 T. Betlehem",
  title =        "An Efficient Parameterization of the Room Transfer
                 Function",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2217--2227",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yong Xiang and I. Natgunanathan and Yue Rong and Song
                 Guo",
  title =        "Spread Spectrum-Based High Embedding Capacity
                 Watermarking Method for Audio Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2228--2237",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "In-Chul Yoo and Hyeontaek Lim and Dongsuk Yook",
  title =        "Formant-Based Robust Voice Activity Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2238--2245",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Hueber and L. Girin and X. Alameda-Pineda and G.
                 Bailly",
  title =        "Speaker-Adaptive Acoustic-Articulatory Inversion Using
                 Cascaded {Gaussian} Mixture Regression",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2246--2259",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hequn Bai and G. Richard and L. Daudet",
  title =        "Late Reverberation Synthesis: From Radiance Transfer
                 to Feedback Delay Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2260--2271",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "I. Bayram",
  title =        "A Multichannel Audio Denoising Formulation Based on
                 Spectral Sparsity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2272--2285",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Delgado and X. Anguera and C. Fredouille and J.
                 Serrano",
  title =        "Fast Single- and Cross-Show Speaker Diarization Using
                 Binary Key Speaker Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2286--2297",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "W. S. Percybrooks and E. Moore",
  title =        "A New {HMM}-Based Voice Conversion Methodology
                 Evaluated on Monolingual and Cross-Lingual Conversion
                 Tasks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2298--2310",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Graja and M. Jaoua and L. H. Belguith",
  title =        "Statistical Framework with Knowledge Base Integration
                 for Robust Speech Understanding of the {Tunisian}
                 Dialect",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2311--2321",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "F. Strasser and H. Puder",
  title =        "Adaptive Feedback Cancellation for Realistic Hearing
                 Aid Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2322--2333",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yu Ting Yeung and Tan Lee and Cheung-Chi Leung",
  title =        "Supervised Single-Microphone Multi-Talker Speech
                 Separation with Conditional Random Fields",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2334--2342",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wenyu Jin and W. B. Kleijn",
  title =        "Theory and Design of Multizone Soundfield Reproduction
                 Using Sparse Methods",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2343--2355",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xionghu Zhong and J. R. Hopgood",
  title =        "A {Time--Frequency} Masking Based Random Finite Set
                 Particle Filtering Method for Multiple Acoustic Source
                 Detection and Tracking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2356--2370",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "K. Vijayan and K. S. R. Murty",
  title =        "Analysis of Phase Spectrum of Speech Signals Using
                 Allpass Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2371--2383",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Marquardt and E. Hadad and S. Gannot and S. Doclo",
  title =        "Theoretical Analysis of Linearly Constrained
                 Multi-Channel {Wiener} Filtering Algorithms for
                 Combined Noise Reduction and Binaural Cue Preservation
                 in Binaural Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2384--2397",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Zohrer and R. Peharz and F. Pernkopf",
  title =        "Representation Learning for Single-Channel Source
                 Separation and Bandwidth Extension",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2398--2409",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hao Fang and M. Ostendorf and P. Baumann and J.
                 Pierrehumbert",
  title =        "Exponential Language Modeling Using Morphological
                 Features and Multi-Task Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2410--2421",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. A. Carlin and M. Elhilali",
  title =        "A Framework for Speech Activity Detection Using
                 Adaptive Auditory Receptive Fields",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2422--2433",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Saito and K. Oishi and T. Furukawa",
  title =        "Convolutive Blind Source Separation Using an Iterative
                 Least-Squares Algorithm for Non-Orthogonal Approximate
                 Joint Diagonalization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2434--2448",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "E. Hadad and D. Marquardt and S. Doclo and S. Gannot",
  title =        "Theoretical Analysis of Binaural Transfer Function
                 {MVDR} Beamformers with Interference Cue Preservation
                 Constraints",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2449--2464",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guang Yang and R. F. Lyon and E. M. Drakakis",
  title =        "Psychophysical Evaluation of An Ultra-Low Power,
                 Analog Biomimetic Cochlear Implant Processor Filterbank
                 Architecture With Across Channels {AGC}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2465--2473",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "List of Reviewers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "12",
  pages =        "2474--2476",
  month =        dec,
  year =         "2015",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Nov 17 07:34:26 MST 2015",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "1--2",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "3--4",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Brognaux and T. Drugman",
  title =        "{HMM}-Based Speech Segmentation: Improvements of Fully
                 Automatic Approaches",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "5--15",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. Tahon and L. Devillers",
  title =        "Towards a Small Set of Robust Acoustic Features for
                 Emotion Recognition: Challenges",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "16--28",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Behravan and V. Hautamaki and S. M. Siniscalchi and
                 T. Kinnunen and Chin-Hui Lee",
  title =        "$i$-Vector Modeling of Speech Attributes for Automatic
                 Foreign Accent Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "29--41",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R. Saeidi and P. Alku and T. Backstrom",
  title =        "Feature Extraction Using Power-Law Adjusted Linear
                 Prediction With Application to Speaker Recognition
                 Under Severe Vocal Effort Mismatch",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "42--53",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "I. T. Ardekani and J. P. Kaipio and A. Nasiri and H.
                 Sharifzadeh and W. H. Abdulla",
  title =        "A Statistical Inverse Problem Approach to Online
                 Secondary Path Modeling in Active Noise Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "54--64",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Stafylakis and P. Kenny and M. J. Alam and M.
                 Kockmann",
  title =        "Speaker and Channel Factors in Text-Dependent Speaker
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "65--78",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yanzhang He and P. Baumann and Hao Fang and B.
                 Hutchinson and A. Jaech and M. Ostendorf and E.
                 Fosler-Lussier and J. Pierrehumbert",
  title =        "Using Pronunciation-Based Morphological Subword Units
                 to Improve {OOV} Handling in Keyword Search",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "79--92",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Meng Sun and Xiongwei Zhang and H. {Van Hamme} and T.
                 F. Zheng",
  title =        "Unseen Noise Estimation Using Separable Deep Auto
                 Encoder for Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "93--104",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "L. Ferrer and Yun Lei and M. McLaren and N. Scheffer",
  title =        "Study of Senone-Based Deep Neural Network Approaches
                 for Spoken Language Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "105--116",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. I. Adalbjornsson and T. Kronvall and S. Burgess and
                 K. Astrom and A. Jakobsson",
  title =        "Sparse Localization of Harmonic Audio Sources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "117--129",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Man-Wai Mak and Xiaomin Pang and Jen-Tzung Chien",
  title =        "Mixture of {PLDA} for Noise Robust {$I$}-Vector
                 Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "130--142",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "C. A. Anderson and P. D. Teal and M. A. Poletti",
  title =        "Spatial Correlation of Radial {Gaussian} and Uniform
                 Spherical Volume Near-Field Source Distributions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "143--150",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Torres and J. Gurlekian",
  title =        "Novel Estimation Method for the Superpositional
                 Intonation Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "151--160",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Bilbao and B. Hamilton and J. Botts and L.
                 Savioja",
  title =        "Finite Volume Time Domain Room Acoustics Simulation
                 under General Impedance Boundary Conditions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "161--173",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. H. Harati Nejad Torbati and J. Picone",
  title =        "A Doubly Hierarchical {Dirichlet} Process Hidden
                 {Markov} Model with a Non-Ergodic Structure",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "174--184",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jen-Tzung Chien and Po-Kai Yang",
  title =        "{Bayesian} Factorization and Learning for Monaural
                 Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "185--195",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. L. Alon and B. Rafaely",
  title =        "Beamforming with Optimal Aliasing Cancellation in
                 Spherical Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "196--210",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "211--212",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "213--214",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Special issue on sound scene and event analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "215",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "C1",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "C2",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "C3",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "1",
  pages =        "C4",
  month =        jan,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "211--212",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "213--214",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "E. Rasumow and M. Hansen and S. van de Par and D.
                 Puschel and V. Mellert and S. Doclo and M. Blau",
  title =        "Regularization Approaches for Synthesizing {HRTF}
                 Directivity Patterns",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "215--225",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chao Pan and J. Benesty and Jingdong Chen",
  title =        "Design of Directivity Patterns with a Unique Null of
                 Maximum Multiplicity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "226--235",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jeih-Weih Hung and Hsin-Ju Hsieh and Berlin Chen",
  title =        "Robust Speech Recognition via Enhancing the
                 Complex-Valued Acoustic Spectrum in Modulation Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "236--251",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiao-Lei Zhang and DeLiang Wang",
  title =        "Boosting Contextual Information for Deep Neural
                 Network Based Voice Activity Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "252--264",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "M. A. Tugtekin Turan and E. Erzin",
  title =        "Source and Filter Estimation for Throat-Microphone
                 Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "265--275",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "N. Mohammadiha and S. Doclo",
  title =        "Speech Dereverberation Using Non-Negative Convolutive
                 Transfer Function and Spectro-Temporal Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "276--289",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Sharma and S. Kaul",
  title =        "Two-Stage Supervised Learning-Based Method to Detect
                 Screams and Cries in Urban Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "290--299",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaoguang Wu and Huawei Chen",
  title =        "Directivity Factors of the First-Order Steerable
                 Differential Array With Microphone Mismatches:
                 Deterministic and Worst-Case Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "300--315",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. I. Koutrouvelis and G. P. Kafentzis and N. D.
                 Gaubitch and R. Heusdens",
  title =        "A Fast Method for High-Resolution Voiced\slash
                 Unvoiced Detection and Glottal Closure\slash Opening
                 Instant Estimation of Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "316--328",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Nakamura and E. Nakamura and S. Sagayama",
  title =        "Real-Time Audio-to-Score Alignment of Music
                 Performances Containing Errors and Arbitrary Repeats
                 and Skips",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "329--339",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Bahne and A. Ahlen",
  title =        "Optimizing the Similarity of Loudspeaker-Room
                 Responses in Multiple Listening Positions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "340--353",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "J. M. Kates and K. H. Arehart",
  title =        "The {Hearing-Aid Audio Quality Index (HAAQI)}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "354--365",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Schepker and S. Doclo",
  title =        "A Semidefinite Programming Approach to Min-max
                 Estimation of the Common Part of Acoustic Feedback
                 Paths in Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "366--377",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bong-Ki Lee and Joon-Hyuk Chang",
  title =        "Packet Loss Concealment Based on Deep Neural Networks
                 for Digital Speech Transmission",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "378--387",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "L. Bentivogli and N. Bertoldi and M. Cettolo and M.
                 Federico and M. Negri and M. Turchi",
  title =        "On the Evaluation of Adaptive Machine Translation for
                 Human Post-Editing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "388--399",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "400--401",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "402--403",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Special issue on sound scene and event analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "404",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "C1",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "C2",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "C3",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "[{Blank} page]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "C4",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "405--406",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "407--408",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Reinhard Sonnleitner and Gerhard Widmer",
  title =        "Robust Quad-Based Audio Fingerprinting",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "409--421",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Li Dong and Furu Wei and Ke Xu and Shixia Liu and Ming
                 Zhou",
  title =        "Adaptive Multi-Compositionality for Recursive Neural
                 Network Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "422--431",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zheng Lin and Xiaolong Jin and Xueke Xu and Yuanzhuo
                 Wang and Xueqi Cheng and Weiping Wang and Dan Meng",
  title =        "An Unsupervised Cross-Lingual Topic Model Framework
                 for Sentiment Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "432--444",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anil Nagathil and Claus Weihs and Rainer Martin",
  title =        "Spectral Complexity Reduction of Music Signals for
                 Mitigating Effects of Cochlear Hearing Loss",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "445--458",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tian Tan and Yanmin Qian and Kai Yu",
  title =        "Cluster Adaptive Training for Deep Neural Network
                 Based Acoustic Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "459--468",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Arne Leijon and Gustav Eje Henter and Martin
                 Dahlquist",
  title =        "{Bayesian} Analysis of Phoneme Confusion Matrices",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "469--482",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Donald S. Williamson and Yuxuan Wang and DeLiang
                 Wang",
  title =        "Complex Ratio Masking for Monaural Speech Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "483--492",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Johannes Traa and David Wingate and Noah D. Stein and
                 Paris Smaragdis",
  title =        "Robust Source Localization and Enhancement With a
                 Probabilistic Steered Response Power Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "493--503",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sven Ewan Shepstone and Kong Aik Lee and Haizhou Li
                 and Zheng-Hua Tan and S{\o}ren Holdt Jensen",
  title =        "Total Variability Modeling Using Source-Specific
                 Priors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "504--517",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Martin Schneider and Walter Kellermann",
  title =        "Multichannel Acoustic Echo Cancellation in the Wave
                 Domain With Increased Robustness to Nonuniqueness",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "518--529",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ken O'Hanlon and Hidehisa Nagano and Nicolas Keriven
                 and Mark D. Plumbley",
  title =        "Non-Negative Group Sparsity with Subspace Note
                 Modelling for Polyphonic Transcription",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "530--542",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Elior Hadad and Simon Doclo and Sharon Gannot",
  title =        "The Binaural {LCMV} Beamformer and its Performance
                 Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "543--558",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Felipe Grijalva and Luiz Martini and Dinei Florencio
                 and Siome Goldenstein",
  title =        "A Manifold Learning Approach for Personalizing {HRTFs}
                 from Anthropometric Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "559--570",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lin Wang and Simon Doclo",
  title =        "Correlation Maximization-Based Sampling Rate Offset
                 Estimation for Distributed Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "571--582",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Nasim Radmanesh and Ian S. Burnett and Bhaskar D.
                 Rao",
  title =        "A Lasso-{LS} Optimization with a Frequency Variable
                 Dictionary in a Multizone Sound System",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "583--593",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xin Liu and Changchun Bao",
  title =        "Audio Bandwidth Extension Based on Ensemble Echo State
                 Networks with Temporal Evolution",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "594--607",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{EDICS} Categories for {IEEE\slash ACM Transactions on
                 Audio, Speech, and Language Processing}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "608--609",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "610--611",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Special issue on sound scene and event analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "612",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Introducing {IEEE Collabratec}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "613",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "C1",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "C2",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "C3",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "608--609",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "610--611",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Peifeng Li and Guodong Zhou",
  title =        "Joint Argument Inference in {Chinese} Event Extraction
                 with Argument Consistency and Event Relevance",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "612--622",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jianming Liu and Steven L. Grant",
  title =        "Proportionate Adaptive Filtering for Block-Sparse
                 System Identification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "623--630",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jesper Rindom Jensen and Jacob Benesty and Mads
                 Gr{\ae}sb{\o}ll Christensen",
  title =        "Noise Reduction with Optimal Variable Span Linear
                 Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "631--644",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sidsel Marie N{\o}rholm and Jesper Rindom Jensen and
                 Mads Gr{\ae}sb{\o}ll Christensen",
  title =        "Enhancement and Noise Statistics Estimation for
                 Non-Stationary Voiced Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "645--658",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Daryush D. Mehta and Jarrad H. {Van Stan} and Robert
                 E. Hillman",
  title =        "Relationships Between Vocal Function Measures Derived
                 from an Acoustic Microphone and a Subglottal
                 Neck-Surface Accelerometer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "659--668",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Herman Kamper and Aren Jansen and Sharon Goldwater",
  title =        "Unsupervised Word Segmentation and Lexicon Discovery
                 Using Acoustic Word Embeddings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "669--679",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ina Kodrasi and Simon Doclo",
  title =        "Joint Dereverberation and Noise Reduction Based on
                 Acoustic Multi-Channel Equalization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "680--693",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hamid Palangi and Li Deng and Yelong Shen and Jianfeng
                 Gao and Xiaodong He and Jianshu Chen and Xinying Song
                 and Rabab Ward",
  title =        "Deep Sentence Embedding Using Long Short-Term Memory
                 Networks: Analysis and Application to Information
                 Retrieval",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "694--707",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Michael Jeffet and Noam R. Shabtai and Boaz Rafaely",
  title =        "Theory and Perceptual Evaluation of the Binaural
                 Reproduction and Beamforming Tradeoff in the
                 Generalized Spherical Array Beamformer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "708--718",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Pablo Peso Parada and Dushyant Sharma and Jose Lainez
                 and Daniel Barreda and Toon van Waterschoot and Patrick
                 A. Naylor",
  title =        "A Single-Channel Non-Intrusive {C50} Estimator
                 Correlated With Speech Recognition Performance",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "719--732",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ming-Hsiang Su and Chung-Hsien Wu and Yu-Ting Zheng",
  title =        "Exploiting Turn-Taking Temporal Evolution for
                 Personality Trait Perception in Dyadic Conversations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "733--744",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sadaf Abdul-Rauf and Holger Schwenk and Patrik Lambert
                 and Mohammad Nawaz",
  title =        "Empirical Use of Information Retrieval to Build
                 Synthetic Data for {SMT} Domain Adaptation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "745--754",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shinnosuke Takamichi and Tomoki Toda and Alan W. Black
                 and Graham Neubig and Sakriani Sakti and Satoshi
                 Nakamura",
  title =        "Postfilters to Modify the Modulation Spectrum for
                 Statistical Parametric Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "755--767",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhizheng Wu and Phillip L. {De Leon} and Cenk
                 Demiroglu and Ali Khodabakhsh and Simon King and
                 Zhen-Hua Ling and Daisuke Saito and Bryan Stewart and
                 Tomoki Toda and Mirjam Wester and Junichi Yamagishi",
  title =        "Anti-Spoofing for Text-Independent Speaker
                 Verification: an Initial Database, Comparison of
                 Countermeasures, and Human Performance",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "768--783",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kristian Timm Andersen and Marc Moonen",
  title =        "Adaptive Time-Frequency Analysis for Noise Reduction
                 in an Audio Filter Bank With Low Delay",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "784--795",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhong-Qiu Wang and DeLiang Wang",
  title =        "A Joint Training Framework for Robust Automatic Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "796--806",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Huy Phan and Lars Hertel and Marco Maass and Radoslaw
                 Mazur and Alfred Mertins",
  title =        "Learning Representations for Nonspeech Audio Events
                 Through Their Similarities to Speech Patterns",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "807--822",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{EDICS} Categories for {IEEE\slash ACM Transactions on
                 Audio, Speech, and Language Processing}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "823--824",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "825--826",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Special issue on sound scene and event analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "827",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Introducing {IEEE Collabratec}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "828",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "C1",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "4",
  pages =        "C2",
  month =        apr,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "829--830",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "831--832",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. J. Tsai and Andreas Stolcke",
  title =        "Robust and Efficient Multiple Alignment of
                 Unsynchronized Meeting Recordings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "833--845",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Simon Receveur and Robin Wei{\ss} and Tim
                 Fingscheidt",
  title =        "Turbo Automatic Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "846--862",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ricard Marxer and Hendrik Purwins",
  title =        "Unsupervised Incremental Online Learning and
                 Prediction of Musical Audio Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "863--874",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mohammad Adeli and Jean Rouat and Sean Wood and
                 St{\'e}phane Molotchnikoff and Eric Plourde",
  title =        "A Flexible Bio-Inspired Hierarchical Model for
                 Analyzing Musical Timbre",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "875--889",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Geliang Zhang and Simon Godsill",
  title =        "Fundamental Frequency Estimation in Speech Signals
                 With Variable Rate Particle Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "890--900",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Nadine Kroher and Emilia G{\'o}mez",
  title =        "Automatic Transcription of Flamenco Singing From
                 Polyphonic Music Recordings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "901--913",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Fiete Winter and Jens Ahrens and Sascha Spors",
  title =        "On Analytic Methods for {$ 2.5$-D} Local Sound Field
                 Synthesis Using Circular Distributions of Secondary
                 Sources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "914--926",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Siddharth Sigtia and Emmanouil Benetos and Simon
                 Dixon",
  title =        "An End-to-End Neural Network for Polyphonic Piano
                 Music Transcription",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "927--939",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Martin Krawczyk-Becker and Timo Gerkmann",
  title =        "Fundamental Frequency Informed Speech Enhancement in a
                 Flexible Statistical Framework",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "940--951",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Joseph Szurley and Alexander Bertrand and Bas {Van
                 Dijk} and Marc Moonen",
  title =        "Binaural Noise Cue Preservation in a Binaural Noise
                 Reduction System With a Remote Microphone Signal",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "952--966",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiao-Lei Zhang and DeLiang Wang",
  title =        "A Deep Ensemble Learning Method for Monaural Speech
                 Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "967--977",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Haotian Xu and Zhijian Ou",
  title =        "Scalable Discovery of Audio Fingerprint Motifs in
                 Broadcast Streams With Determinantal Point Process
                 Based Motif Clustering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "978--989",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "990--991",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "992--993",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Special issue on sound scene and event analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "994",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Special Issue on Biosignal-based Spoken
                 Communication",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "995",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "C1",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "C2",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Power Electronics Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "C3",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "5",
  pages =        "C4",
  month =        may,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:37 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "990--991",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "992--993",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Asli Celikyilmaz and Ruhi Sarikaya and Minwoo Jeong
                 and Anoop Deoras",
  title =        "An Empirical Investigation of Word Class-Based
                 Features for Natural Language Understanding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "994--1005",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Duc Hoang Ha Nguyen and Xiong Xiao and Eng Siong Chng
                 and Haizhou Li",
  title =        "Feature Adaptation Using Linear Spectro-Temporal
                 Transform for Robust Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1006--1019",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaojun Qian and Helen Meng and Frank Soong",
  title =        "A Two-Pass Framework of Mispronunciation Detection and
                 Diagnosis for Computer-Aided Pronunciation Training",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1020--1028",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lijiang Chen and Xia Mao and Hong Yan",
  title =        "Text-Independent Phoneme Segmentation Combining {EGG}
                 and Speech Data",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1029--1037",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Vincent Mohammad Tavakoli and Jesper Rindom Jensen and
                 Mads Gr{\ae}sb{\o}ll Christensen and Jacob Benesty",
  title =        "A Framework for Speech Enhancement With Ad Hoc
                 Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1038--1051",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yan-You Chen and Chung-Hsien Wu and Yi-Chin Huang and
                 Shih-Lun Lin and Jhing-Fa Wang",
  title =        "Candidate Expansion and Prosody Adjustment for Natural
                 Speech Synthesis Using a Small Corpus",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1052--1065",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xueliang Zhang and Hui Zhang and Shuai Nie and
                 Guanglai Gao and Wenju Liu",
  title =        "A Pairwise Algorithm Using the Deep Stacking Network
                 for Speech Separation and Pitch Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1066--1078",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lin Wang and Tsz-Kin Hon and Joshua D. Reiss and
                 Andrea Cavallaro",
  title =        "An Iterative Approach to Source Counting and
                 Localization Using Two Distant Microphones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1079--1093",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Se{\'a}n O'Leary and Axel R{\"o}bel",
  title =        "A Montage Approach to Sound Texture Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1094--1105",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chahid Ouali and Pierre Dumouchel and Vishwa Gupta",
  title =        "Fast Audio Fingerprinting System Using {GPU} and a
                 Clustering-Based Technique",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1106--1118",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Francisco Raposo and Ricardo Ribeiro and David Martins
                 de Matos",
  title =        "Using Generic Summarization to Improve Music
                 Information Retrieval Tasks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1119--1128",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lantian Li and Dong Wang and Chenhao Zhang and Thomas
                 Fang Zheng",
  title =        "Improving Short Utterance Speaker Recognition by
                 Modeling Speech Unit Classes",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1129--1139",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jalal Taghia and Rainer Martin",
  title =        "A Frequency-Domain Adaptive Line Enhancer With
                 Step-Size Control Based on Mutual Information for
                 Harmonic Noise Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1140--1154",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1155--1156",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1157--1158",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Special issue on sound scene and event analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1159",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Special Issue on Biosignal-based Spoken
                 Communication",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "1160",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "C1",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "C2",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Power Electronics Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "C3",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "6",
  pages =        "C4",
  month =        jun,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Min Gao and Jing Lu and Xiaojun Qiu",
  title =        "A Simplified Subband {ANC} Algorithm Without Secondary
                 Path Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1164--1174",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ryo Aihara and Tetsuya Takiguchi and Yasuo Ariki",
  title =        "Multiple Non-Negative Matrix Factorization for
                 Many-to-Many Voice Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1175--1184",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kai Chen and Qiang Huo",
  title =        "Training Deep Bidirectional {LSTM} Acoustic Model for
                 {LVCSR} by a Context-Sensitive-Chunk {BPTT} Approach",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1185--1193",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Themos Stafylakis and Md. Jahangir Alam and Patrick
                 Kenny",
  title =        "Text-Dependent Speaker Recognition With Random Digit
                 Strings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1194--1203",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "K. T. Deepak and S. R. Mahadeva Prasanna",
  title =        "Foreground Speech Segmentation and Enhancement Using
                 Glottal Closure Instants and Mel Cepstral
                 Coefficients",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1204--1218",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Habib Hajimolahoseini and Rassoul Amirfattahi and
                 Saeed Gazor and Hamid Soltanian-Zadeh",
  title =        "Robust Estimation and Tracking of Pitch Period Using
                 an Efficient {Bayesian} Filter",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1219--1229",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Subhasmita Sahoo and Aurobinda Routray",
  title =        "A Novel Method of Glottal Inverse Filtering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1230--1241",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Gilles Degottex and Luc Ardaillon and Axel Roebel",
  title =        "Multi-Frame Amplitude Envelope Estimation for
                 Modification of Singing Voice",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1242--1254",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhizheng Wu and Simon King",
  title =        "Improving Trajectory Modelling for {DNN}-Based Speech
                 Synthesis by Using Stacked Bottleneck Features and
                 Minimum Generation Error Training",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1255--1265",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xabier Jaureguiberry and Emmanuel Vincent and Ga{\"e}l
                 Richard",
  title =        "Fusion Methods for Speech Enhancement and Audio Source
                 Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1266--1279",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rajib Lochan Das and Mrityunjoy Chakraborty",
  title =        "Improving the Performance of the {PNLMS} Algorithm
                 Using Norm Regularization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1280--1290",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Maja Taseska and Emanu{\"e}l A. P. Habets",
  title =        "Spotforming: Spatial Filtering With Distributed Arrays
                 for Position-Selective Sound Acquisition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1291--1304",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guangyou Zhou and Zhiwen Xie and Tingting He and Jun
                 Zhao and Xiaohua Tony Hu",
  title =        "Learning the Multilingual Translation Representations
                 for Question Retrieval in Community Question Answering
                 via Non-Negative Matrix Factorization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1305--1314",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chanwoo Kim and Richard M. Stern",
  title =        "Power-Normalized Cepstral Coefficients {(PNCC)} for
                 Robust Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "7",
  pages =        "1315--1329",
  month =        jul,
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:38 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Henning Schepker and Simon Doclo",
  title =        "Least-Squares Estimation of the Common Pole-Zero
                 Filter of Acoustic Feedback Paths in Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "8",
  pages =        "1334--1347",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:39 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hannes Pessentheiner and Martin Hagm{\"u}ller and
                 Gernot Kubin",
  title =        "Localization and Characterization of Multiple Harmonic
                 Sources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "8",
  pages =        "1348--1363",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:39 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hanieh Khalilian and Ivan V. Baji{\'c} and Rodney G.
                 Vaughan",
  title =        "Comparison of Loudspeaker Placement Methods for Sound
                 Field Reproduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "8",
  pages =        "1364--1379",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:39 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Cheng-Yen Yang and Chih-Wei Liu and Shyh-Jye Jou",
  title =        "A Systematic {ANSI S1.11} Filter Bank Specification
                 Relaxation and Its Efficient Multirate Architecture for
                 Hearing-Aid Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "8",
  pages =        "1380--1392",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:39 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bracha Laufer-Goldshtein and Ronen Talmon and Sharon
                 Gannot",
  title =        "Semi-Supervised Sound Source Localization Based on
                 Manifold Regularization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "8",
  pages =        "1393--1407",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:39 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dionyssos Kounades-Bastian and Laurent Girin and
                 Xavier Alameda-Pineda and Sharon Gannot and Radu
                 Horaud",
  title =        "A Variational {EM} Algorithm for the Separation of
                 Time-Varying Convolutive Audio Mixtures",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "8",
  pages =        "1408--1423",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:39 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jun Du and Yanhui Tu and Li-Rong Dai and Chin-Hui
                 Lee",
  title =        "A Regression Approach to Single-Channel Speech
                 Separation Via High-Resolution Deep Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "8",
  pages =        "1424--1437",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:39 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xunying Liu and Xie Chen and Yongqiang Wang and Mark
                 J. F. Gales and Philip C. Woodland",
  title =        "Two Efficient Lattice Rescoring Methods Using
                 Recurrent Neural Network Language Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "8",
  pages =        "1438--1449",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:39 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Pawel Swietojanski and Jinyu Li and Steve Renals",
  title =        "Learning Hidden Unit Contributions for Unsupervised
                 Acoustic Model Adaptation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "8",
  pages =        "1450--1463",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:39 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Meng Zhang and Yang Liu and Huanbo Luan and Maosong
                 Sun",
  title =        "Listwise Ranking Functions for Statistical Machine
                 Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "8",
  pages =        "1464--1472",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:39 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1477--1478",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1479--1480",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Daniel C. Cavalieri and Sira E. Palazuelos-Cagigas and
                 Teodiano F. Bastos-Filho and M{\'a}rio
                 Sarcinelli-Filho",
  title =        "Combination of Language Models for Word Prediction: An
                 Exponential Approach",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1481--1494",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ofer Schwartz and Sharon Gannot and Emanu{\"e}l A. P.
                 Habets",
  title =        "An Expectation-Maximization Algorithm for
                 Multimicrophone Speech Dereverberation and Noise
                 Reduction With Coherence Matrix Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1495--1510",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Symeon Delikaris-Manias and Juha Vilkamo and Ville
                 Pulkki",
  title =        "Signal-Dependent Spatial Filtering Based on
                 Weighted-Orthogonal Beamformers in the Spherical
                 Harmonic Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1511--1523",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sheng Li and Yuya Akita and Tatsuya Kawahara",
  title =        "Semi-Supervised Acoustic Model Training by
                 Discriminative Data Selection From Multiple {ASR}
                 Systems' Hypotheses",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1524--1534",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Christian Dittmar and Meinard M{\"u}ller",
  title =        "Reverse Engineering the Amen Break --- Score-Informed
                 Separation and Restoration Applied to Drum Recordings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1535--1547",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chao Pan and Jingdong Chen and Jacob Benesty",
  title =        "Reduced-Order Robust Superdirective Beamforming With
                 Uniform Linear Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1548--1559",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Derry FitzGerald and Antoine Liutkus and Roland
                 Badeau",
  title =        "Projection-Based Demixing of Spatial Audio",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1560--1572",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lin Wang and Joshua D. Reiss and Andrea Cavallaro",
  title =        "Over-Determined Source Separation and Localization
                 Using Distributed Microphones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1573--1588",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yang Liu and Sujian Li and Furu Wei and Heng Ji",
  title =        "Relation Classification Via Modeling Augmented
                 Dependency Paths",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1589--1598",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Adam Kuklasi{\'n}ski and Simon Doclo and S{\o}ren
                 Holdt Jensen and Jesper Jensen",
  title =        "Maximum Likelihood {PSD} Estimation for Speech
                 Enhancement in Reverberation and Noise",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1599--1612",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sam Karimian-Azari and Jesper Rindom Jensen and Mads
                 Gr{\ae}sb{\o}ll Christensen",
  title =        "Computationally Efficient and Noise Robust {DOA} and
                 Pitch Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1613--1625",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Daichi Kitamura and Nobutaka Ono and Hiroshi Sawada
                 and Hirokazu Kameoka and Hiroshi Saruwatari",
  title =        "Determined Blind Source Separation Unifying
                 Independent Vector Analysis and Nonnegative Matrix
                 Factorization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1626--1641",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Nicolas Obin and Axel Roebel",
  title =        "Similarity Search of Acted Voices for Automatic Voice
                 Casting",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1642--1651",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Aditya Arie Nugraha and Antoine Liutkus and Emmanuel
                 Vincent",
  title =        "Multichannel Audio Source Separation With Deep Neural
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1652--1664",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Stephen H. Shum and David F. Harwath and Najim Dehak
                 and James R. Glass",
  title =        "On the Use of Acoustic Unit Discovery for Language
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1665--1676",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1677--1678",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1679--1680",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Introducing the {IEEE PES Resource Center}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "1681",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "C1",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "C2",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "C3",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "9",
  pages =        "C4",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1677--1678",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1679--1680",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "James Eaton and Nikolay D. Gaubitch and Alastair H.
                 Moore and Patrick A. Naylor",
  title =        "Estimation of Room Acoustic Parameters: The {ACE}
                 Challenge",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1681--1693",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Takashi Nose",
  title =        "Efficient Implementation of Global Variance
                 Compensation for Parametric Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1694--1704",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shabnam Ghaffarzadegan and Hynek Bo{\v{r}}il and John
                 H. L. Hansen",
  title =        "Generative Modeling of Pseudo-Whisper for Robust
                 Whispered Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1705--1720",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Seyedmahdad Mirsamadi and John H. L. Hansen",
  title =        "A Generalized Nonnegative Tensor Factorization
                 Approach for Distant Speech Recognition With
                 Distributed Microphones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1721--1731",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Laura Fuster and Maria de Diego and Luis A.
                 Azpicueta-Ruiz and Miguel Ferrer",
  title =        "Adaptive Filtered-x Algorithms for Room Equalization
                 Based on Block-Based Combination Schemes",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1732--1745",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kamil Adilo{\u{g}}lu and Emmanuel Vincent",
  title =        "Variational {Bayesian} Inference for Source Separation
                 and Robust Feature Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1746--1758",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Steffen Kortlang and Giso Grimm and Volker Hohmann and
                 Birger Kollmeier and Stephan D. Ewert",
  title =        "Auditory Model-Based Dynamic Compression Controlled by
                 Subband Instantaneous Frequency and Speech Presence
                 Probability Estimates",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1759--1772",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Pawel Swietojanski and Steve Renals",
  title =        "Differentiable Pooling for Unsupervised Acoustic Model
                 Adaptation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1773--1784",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kenta Niwa and Yusuke Hioka and Kazunori Kobayashi",
  title =        "Optimal Microphone Array Observation for Clear
                 Recording of Distant Sound Sources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1785--1795",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Nicolas Epain and Craig T. Jin",
  title =        "Spherical Harmonic Signal Covariance and Sound Field
                 Diffuseness",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1796--1807",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tudor-C{\u{a}}t{\u{a}}lin Zoril{\u{a}} and Yannis
                 Stylianou and Tatsuma Ishihara and Masami Akamine",
  title =        "Near and Far Field Speech-in-Noise Intelligibility
                 Improvements Based on a Time--Frequency Energy
                 Reallocation Approach",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1808--1818",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xi Ma and Dong Wang and Javier Tejedor",
  title =        "Similar Word Model for Unfrequent Word Enhancement in
                 Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1819--1830",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mohammad Hadi Bokaei and Hossein Sameti and Yang Liu",
  title =        "Summarizing Meeting Transcripts Based on Functional
                 Segmentation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1831--1841",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiajun Zhang and Yu Zhou and Chengqing Zong",
  title =        "Abstractive Cross-Language Summarization via
                 Translation Model Enhanced Predicate Argument Structure
                 Fusing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1842--1853",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Gr{\'e}goire Lafay and Mathieu Lagrange and Mathias
                 Rossignol and Emmanouil Benetos and Axel Roebel",
  title =        "A Morphological Model for Simulating Acoustic Scenes
                 and Its Application to Sound Event Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1854--1864",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "An Ji and Michael T. Johnson and Jeffrey J. Berry",
  title =        "Parallel Reference Speaker Weighting for
                 Kinematic-Independent Acoustic-to-Articulatory
                 Inversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1865--1875",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1876--1877",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1878--1879",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Introducing the {IEEE PES Resource Center}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "1880",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "C1",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "C2",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "C3",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "10",
  pages =        "C4",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:17 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "1881--1882",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "1883--1884",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Aggelos Gkiokas and Vassilis Katsouros and George
                 Carayannis",
  title =        "Towards Multi-Purpose Spectral Rhythm Features: An
                 Application to Dance Style, Meter and Tempo
                 Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "1885--1896",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi-Chin Huang and Chung-Hsien Wu and Si-Ting Weng",
  title =        "Improving {Mandarin} Prosody Generation Using
                 Alternative Smoothing Techniques",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "1897--1907",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Asger Heidemann Andersen and Jan Mark de Haan and
                 Zheng-Hua Tan and Jesper Jensen",
  title =        "Predicting the Intelligibility of Noisy and
                 Nonlinearly Processed Binaural Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "1908--1920",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qiaoling Zhang and Zhe Chen and Fuliang Yin",
  title =        "Distributed Marginalized Auxiliary Particle Filter for
                 Speaker Tracking in Distributed Microphone Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "1921--1934",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Marc Ferr{\`a}s and Srikanth Madikeri and Herv{\'e}
                 Bourlard",
  title =        "Speaker Diarization and Linking of Meeting Data",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "1935--1945",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuzong Liu and Katrin Kirchhoff",
  title =        "Graph-Based Semisupervised Learning for Acoustic
                 Modeling in Automatic Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "1946--1956",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jin Wang and Liang-Chih Yu and K. Robert Lai and
                 Xuejie Zhang",
  title =        "Community-Based Weighted Graph Model for
                 Valence-Arousal Prediction of Affective Words",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "1957--1968",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Alberto Carini and Stefania Cecchi and Laura Romoli",
  title =        "Robust Room Impulse Response Measurement Using Perfect
                 Sequences for {Legendre} Nonlinear Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "1969--1982",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sebastian Ewert and Mark Sandler",
  title =        "Piano Transcription in the Studio Using an Extensible
                 Alternating Directions Framework",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "1983--1997",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yu-Ren Chien and Hsin-Min Wang and Shyh-Kang Jeng",
  title =        "Alignment of Lyrics With Accompanied Singing Audio
                 Based on Acoustic-Phonetic Vowel Likelihood Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "1998--2008",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jesper Jensen and Cees H. Taal",
  title =        "An Algorithm for Predicting the Intelligibility of
                 Speech Masked by Modulated Noise Maskers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2009--2022",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaodong Cui and Vaibhava Goel",
  title =        "Maximum Likelihood Nonlinear Transformations Based on
                 Deep Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2023--2031",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  note =         "See correction \cite{Kuklasinski:2017:CTM}.",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Toru Nakashika and Tetsuya Takiguchi and Yasuhiro
                 Minami",
  title =        "Non-Parallel Training in Voice Conversion Using an
                 Adaptive Restricted {Boltzmann} Machine",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2032--2045",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "I-Bin Liao and Chen-Yu Chiang and Yih-Ru Wang and
                 Sin-Horng Chen",
  title =        "Speaker Adaptation of {SR-HPM} for Speaking
                 Rate-Controlled {Mandarin} {TTS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2046--2058",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hiroki Ouchi and Kevin Duh and Hiroyuki Shindo and
                 Yuji Matsumoto",
  title =        "Transition-Based Dependency Parsing Exploiting
                 Supertags",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2059--2068",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tong Xiao and Derek F. Wong and Jingbo Zhu",
  title =        "A Loss-Augmented Approach to Training Syntactic
                 Machine Translation Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2069--2083",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yukara Ikemiya and Katsutoshi Itoyama and Kazuyoshi
                 Yoshii",
  title =        "Singing Voice Separation and Vocal {F0} Estimation
                 Based on Mutual Combination of Robust Principal
                 Component Analysis and Subharmonic Summation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2084--2095",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Siddharth Sigtia and Adam M. Stark and Sacha
                 Krstulovi{\'c} and Mark D. Plumbley",
  title =        "Automatic Environmental Sound Recognition: Performance
                 Versus Computational Cost",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2096--2107",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Srinivas Parthasarathy and Roddy Cowie and Carlos
                 Busso",
  title =        "Using Agreement on Direction of Change to Build
                 Rank-Based Emotion Classifiers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2108--2121",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jia-Ching Wang and Yuan-Shan Lee and Chang-Hong Lin
                 and Shu-Fan Wang and Chih-Hao Shih and Chung-Hsien Wu",
  title =        "Compressive Sensing-Based Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2122--2131",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Siying Wang and Sebastian Ewert and Simon Dixon",
  title =        "Robust and Efficient Joint Alignment of Multiple
                 Musical Performances",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2132--2145",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xie Chen and Xunying Liu and Yongqiang Wang and Mark
                 J. F. Gales and Philip C. Woodland",
  title =        "Efficient Training and Evaluation of Recurrent Neural
                 Network Language Models for Automatic Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2146--2157",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ping-Keng Jao and Li Su and Yi-Hsuan Yang and Brendt
                 Wohlberg",
  title =        "Monaural Music Source Separation Using Convolutional
                 Sparse Coding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "11",
  pages =        "2158--2170",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Andrea Cogliati and Zhiyao Duan and Brendt Wohlberg",
  title =        "Context-Dependent Piano Music Transcription With
                 Convolutional Sparse Coding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2218--2230",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yanmin Qian and Tian Tan and Dong Yu",
  title =        "Neural Network Based Multi-Factor Aware Joint Training
                 for Robust Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2231--2240",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lahiru Samarakoon and Khe Chai Sim",
  title =        "Factorized Hidden Layer Adaptation for Deep Neural
                 Network Based Acoustic Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2241--2250",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Martin Krawczyk-Becker and Timo Gerkmann",
  title =        "On {MMSE}-Based Estimation of Amplitude and Complex
                 Speech Spectral Coefficients Under Phase-Uncertainty",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2251--2262",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yanmin Qian and Mengxiao Bi and Tian Tan and Kai Yu",
  title =        "Very Deep Convolutional Neural Networks for Noise
                 Robust Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2263--2276",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi-Chan Wu and Homer H. Chen",
  title =        "Generation of Affective Accompaniment in Accordance
                 With Emotion Flow",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2277--2287",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mahmood Movassagh and Peter Kabal",
  title =        "Scalable Audio Coding Using {Trellis}-Based Optimized
                 Joint Entropy Coding and Quantization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2288--2300",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Milos Cernak and Alexandros Lazaridis and Afsaneh
                 Asaei and Philip N. Garner",
  title =        "Composition of Deep and Spiking Neural Networks for
                 Very Low Bit Rate Speech Coding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2301--2312",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "David Dov and Ronen Talmon and Israel Cohen",
  title =        "Kernel Method for Voice Activity Detection in the
                 Presence of Transients",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2313--2326",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jes{\'u}s Villalba and Antonio Miguel and Alfonso
                 Ortega and Eduardo Lleida",
  title =        "{Bayesian} Networks to Model the Variability of
                 Speaker Verification Scores in Adverse Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2327--2340",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hardik B. Sailor and Hemant A. Patil",
  title =        "Novel Unsupervised Auditory Filterbank Learning Using
                 Convolutional {RBM} for Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2341--2353",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sidsel Marie N{\o}rholm and Jesper Rindom Jensen and
                 Mads Gr{\ae}sb{\o}ll Christensen",
  title =        "Instantaneous Fundamental Frequency Estimation With
                 Optimal Segmentation for Nonstationary Voiced Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2354--2367",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sheng Zhang and Jiashu Zhang and Hongyu Han",
  title =        "Robust Variable Step-Size Decorrelation Normalized
                 Least-Mean-Square Algorithm and its Application to
                 Acoustic Echo Cancellation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2368--2376",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tom Barker and Tuomas Virtanen",
  title =        "Blind Separation of Audio Mixtures Through Nonnegative
                 Tensor Factorization of Modulation Spectrograms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2377--2389",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jinxin Liu and Xuefeng Chen",
  title =        "Adaptive Compensation of Misequalization in Narrowband
                 Active Noise Equalizer Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2390--2399",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Atsunori Ogawa and Takaaki Hori and Atsushi Nakamura",
  title =        "Estimating Speech Recognition Accuracy Based on Error
                 Type Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2400--2413",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Finnian Kelly and John H. L. Hansen",
  title =        "Score-Aging Calibration for Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2414--2424",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bochen Li and Zhiyao Duan",
  title =        "An Approach to Score Following for Piano Performances
                 With the Sustained Effect",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2425--2438",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Niko Moritz and Birger Kollmeier and J{\"o}rn
                 Anem{\"u}ller",
  title =        "Integration of Optimized Modulation Filter Sets Into
                 Deep Neural Networks for Automatic Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2439--2452",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Simon Leglaive and Roland Badeau and Ga{\"e}l
                 Richard",
  title =        "Multichannel Audio Source Separation With
                 Probabilistic Reverberation Priors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2453--2465",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sakari Tervo",
  title =        "Single Snapshot Detection and Estimation of
                 Reflections From Room Impulse Responses in the
                 Spherical Harmonic Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2466--2480",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dejan Markovi{\'c} and Fabio Antonacci and Lucio
                 Bianchi and Stefano Tubaro and Augusto Sarti",
  title =        "Extraction of Acoustic Sources Through the Processing
                 of Sound Field Maps in the Ray Space",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "12",
  pages =        "2481--2494",
  month =        "????",
  year =         "2016",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Oct 25 08:43:18 MDT 2016",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "222--223",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "224--225",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hanchi Chen and Thushara Dheemantha Abhayapala and
                 Prasanga N. Samarasinghe and Wen Zhang",
  title =        "Direct-to-Reverberant Energy Ratio Estimation Using a
                 First-Order Microphone",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "226--237",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Peter Bell and Pawel Swietojanski and Steve Renals",
  title =        "Multitask Learning of Context-Dependent Targets in
                 Deep Neural Network Acoustic Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "238--247",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rui Zhao and Kezhi Mao",
  title =        "Topic-Aware Deep Compositional Models for Sentence
                 Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "248--260",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dalia {El Badawy} and Ngoc Q. K. Duong and Alexey
                 Ozerov",
  title =        "On-the-Fly Audio Source Separation --- A Novel
                 User-Friendly Framework",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "261--272",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Filip Elvander and Johan Sw{\"a}rd and Andreas
                 Jakobsson",
  title =        "Online Estimation of Multiple Harmonic Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "273--284",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Vincent Renkens and Hugo {Van hamme}",
  title =        "Weakly Supervised Learning of Hidden {Markov} Models
                 for Spoken Language Acquisition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "285--295",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Luca Remaggi and Philip J. B. Jackson and Philip
                 Coleman and Wenwu Wang",
  title =        "Acoustic Reflector Localization: Novel Image Source
                 Reversion and Direct Localization Methods",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "296--309",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Prasanga N. Samarasinghe and Thushara D. Abhayapala
                 and Hanchi Chen",
  title =        "Estimating the Direct-to-Reverberant Energy Ratio
                 Using a Spherical Harmonics-Based Spatial Correlation
                 Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "310--319",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shmulik Markovich-Golan and Sharon Gannot and Walter
                 Kellermann",
  title =        "Combined {LCMV-TRINICON} Beamforming for Separating
                 Multiple Speech Sources in Noisy and Reverberant
                 Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "320--332",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shakeel Ahmed and Muhammad Tahir Akhtar",
  title =        "Gain Scheduling of Auxiliary Noise and Variable
                 Step-Size for Online Acoustic Feedback Cancellation in
                 Narrow-Band Active Noise Control Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "333--343",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Gabriel Sargent and Fr{\'e}d{\'e}ric Bimbot and
                 Emmanuel Vincent",
  title =        "Estimating the Structural Segmentation of Popular
                 Music Pieces Under Regularity Constraints",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "344--358",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jordan Cheer and Stephen Daley",
  title =        "An Investigation of Delayless Subband Adaptive
                 Filtering for Multi-Input Multi-Output Active Noise
                 Control Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "359--373",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sebastian J. Schlecht and Emanu{\"e}l A. P. Habets",
  title =        "Feedback Delay Networks: Echo Density and Mixing
                 Time",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "374--383",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Johannes Abel and Magdalena Kaniewska and Cyril
                 Guillaum{\'e} and Wouter Tirry and Tim Fingscheidt",
  title =        "An Instrumental Quality Measure for Artificially
                 Bandwidth-Extended Speech Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "384--396",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Robert Rehr and Timo Gerkmann",
  title =        "An Analysis of Adaptive Recursive Smoothing with
                 Applications to Noise {PSD} Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "397--408",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Emilio Granell and Carlos-D. Mart{\'\i}nez-Hinarejos",
  title =        "Multimodal Crowdsourcing for Transcribing Handwritten
                 Documents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "409--419",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yaping Ma and Yegui Xiao",
  title =        "A New Strategy for Online Secondary-Path Modeling of
                 Narrowband Active Noise Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "420--434",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jose A. Belloch and Alberto Gonzalez and Enrique S.
                 Quintana-Ort{\'\i} and Miguel Ferrer and Vesa
                 V{\"a}lim{\"a}ki",
  title =        "{GPU}-Based Dynamic Wave Field Synthesis Using
                 Fractional Delay Filters and Room Compensation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "435--447",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "448--449",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE} Transactions on Multimedia information for
                 authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "450--451",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Introducing {IEEE Collabratec}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "452",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "C1",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "2",
  pages =        "C2",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "3--4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:46 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "3--4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:46 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "3--4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "3--4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qi He and Feng Bao and Changchun Bao",
  title =        "Multiplicative Update of Auto-Regressive Gains for
                 Codebook-Based Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "457--468",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhongqing Wang and Sophia Yat Mei Lee and Shoushan Li
                 and Guodong Zhou",
  title =        "Emotion Analysis in Code-Switching Text With Joint
                 Factor Graph Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "469--480",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ashwin Bellur and Mounya Elhilali",
  title =        "Feedback-Driven Sensory Mapping Adaptation for Robust
                 Speech Activity Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "481--492",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhiyuan Tang and Lantian Li and Dong Wang and
                 Ravichander Vipperla",
  title =        "Collaborative Joint Training With Multitask Recurrent
                 Model for Speech and Speaker Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "493--504",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bidisha Sharma and S. R. Mahadeva Prasanna",
  title =        "Sonority Measurement Using System, Source, and
                 Suprasegmental Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "505--518",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hung-Yi Lee and Bo-Hsiang Tseng and Tsung-Hsien Wen
                 and Yu Tsao",
  title =        "Personalizing Recurrent-Neural-Network-Based Language
                 Model by Social Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "519--530",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ji Ming and Danny Crookes",
  title =        "Speech Enhancement Based on Full-Sentence Correlation
                 and Clean Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "531--543",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Quoc Truong Do and Tomoki Toda and Graham Neubig and
                 Sakriani Sakti and Satoshi Nakamura",
  title =        "Preserving Word-Level Emphasis in Speech-to-Speech
                 Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "544--556",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhenghua Li and Jiayuan Chao and Min Zhang and
                 Wenliang Chen and Meishan Zhang and Guohong Fu",
  title =        "Coupled {POS} Tagging on Heterogeneous Annotations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "557--571",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Clement S. J. Doire and Mike Brookes and Patrick A.
                 Naylor and Christopher M. Hicks and Dave Betts and
                 Mohammad A. Dmour and S{\o}ren Holdt Jensen",
  title =        "Single-Channel Online Enhancement of Speech Corrupted
                 by Reverberation and Noise",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "572--587",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Aleksandr Sizov and Kong Aik Lee and Tomi Kinnunen",
  title =        "Direct Optimization of the Detection Cost for
                 {$I$}-Vector-Based Spoken Language Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "588--597",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Imran Sheikh and Dominique Fohr and Irina Illina and
                 Georges Linar{\`e}s",
  title =        "Modelling Semantic Context of {OOV} Words in Large
                 Vocabulary Continuous Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "598--610",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mojtaba Farmani and Michael Syskind Pedersen and
                 Zheng-Hua Tan and Jesper Jensen",
  title =        "Informed Sound Source Localization Using Relative
                 Transfer Functions for Hearing Aid Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "611--623",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "C. M. Vikram and S. R. Mahadeva Prasanna",
  title =        "Epoch Extraction From Telephone Quality Speech Using
                 Single Pole Filter",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "624--636",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Motoi Omachi and Tetsuji Ogawa and Tetsunori
                 Kobayashi",
  title =        "Associative Memory Model-Based Linear Filtering and
                 Its Application to Tandem Connectionist Blind Source
                 Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "637--650",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dani Cherkassky and Sharon Gannot",
  title =        "Blind Synchronization in Wireless Acoustic Sensor
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "651--661",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Laurent Girin and Thomas Hueber and Xavier
                 Alameda-Pineda",
  title =        "Extending the Cascaded {Gaussian} Mixture Regression
                 Framework for Cross-Speaker Acoustic-Articulatory
                 Mapping",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "662--673",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mohamad Hasan Bahari and Alexander Bertrand and Marc
                 Moonen",
  title =        "Blind Sampling Rate Offset Estimation for Wireless
                 Acoustic Sensor Networks Through Weighted Least-Squares
                 Coherence Drift Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "674--686",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Adam Kuklasi{\'n}ski and Simon Doclo and S{\o}ren
                 Holdt Jensen and Jesper Jensen",
  title =        "Correction to {``Maximum Likelihood PSD Estimation for
                 Speech Enhancement in Reverberation and Noise''}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "3",
  pages =        "687--687",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Feb 25 09:40:47 MST 2017",
  bibsource =    "",
  note =         "See \cite{Cui:2016:MLN}.",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "688--689",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "690--691",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sharon Gannot and Emmanuel Vincent and Shmulik
                 Markovich-Golan and Alexey Ozerov",
  title =        "A Consolidated Perspective on Multimicrophone Speech
                 Enhancement and Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "692--730",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dongwen Ying and Ruohua Zhou and Junfeng Li and
                 Yonghong Yan",
  title =        "Window-Dominant Signal Subspace Methods for Multiple
                 Short-Term Speech Source Localization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "731--744",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sean U. N. Wood and Jean Rouat and St{\'e}phane Dupont
                 and Gueorgui Pironkov",
  title =        "Blind Speech Separation and Enhancement With
                 {GCC-NMF}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "745--755",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Constantin Spille and Birger Kollmeier and Bernd T.
                 Meyer",
  title =        "Combining Binaural and Cortical Features for Robust
                 Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "756--767",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuma Koizumi and Kenta Niwa and Yusuke Hioka and
                 Kazunori Kobayashi and Hitoshi Ohmuro",
  title =        "Informative Acoustic Feature Selection to Maximize
                 Mutual Information for Collecting Target Sources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "768--779",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Takuya Higuchi and Nobutaka Ito and Shoko Araki and
                 Takuya Yoshioka and Marc Delcroix and Tomohiro
                 Nakatani",
  title =        "Online {MVDR} Beamformer Based on Complex {Gaussian}
                 Mixture Model With Spatial Prior for Noise Robust
                 {ASR}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "780--793",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Eita Nakamura and Kazuyoshi Yoshii and Shigeki
                 Sagayama",
  title =        "Rhythm Transcription of Polyphonic Piano Music Based
                 on Merged-Output {HMM} for Multiple Voices",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "794--806",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Omid Ghahabi and Javier Hernando",
  title =        "Deep Learning Backend for Single and Multisession
                 {$i$}-Vector Speaker Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "807--817",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Penny Karanasou and Chunyang Wu and Mark Gales and
                 Philip C. Woodland",
  title =        "{$I$}-Vectors and Structured Neural Networks for Rapid
                 Adaptation of Acoustic Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "818--828",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "G. Aneeja and B. Yegnanarayana",
  title =        "Extraction of Fundamental Frequency From Degraded
                 Speech Using Temporal Envelopes at High {SNR}
                 Frequencies",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "829--838",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Seyyed Saeed Sarfjoo and Cenk Demiro{\u{g}}lu and
                 Simon King",
  title =        "Using Eigenvoices and Nearest-Neighbors in {HMM}-Based
                 Cross-Lingual Speaker Adaptation With Limited Data",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "839--851",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yung-Yue Chen and Jia-Hao Zhang",
  title =        "Background Noise Reduction Design for Dual Microphone
                 Cellular Phones: Robust Approach",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "852--862",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Liner Yang and Xinxiong Chen and Zhiyuan Liu and
                 Maosong Sun",
  title =        "Improving Word Representations with Document Labels",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "863--870",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shiliang Zhang and Cong Liu and Hui Jiang and Si Wei
                 and Lirong Dai and Yu Hu",
  title =        "Nonrecurrent Neural Structure for Long-Term
                 Dependence",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "871--884",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xuefeng Yang and Kezhi Mao",
  title =        "Task Independent Fine Tuning for Word Embeddings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "885--894",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yu Bao and Huawei Chen",
  title =        "Design of Robust Broadband Beamformers Using
                 Worst-Case Performance Optimization: a Semidefinite
                 Programming Approach",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "895--907",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sandro Cumani and Pietro Laface",
  title =        "Nonlinear {I}-Vector Transformations for {PLDA}-Based
                 Speaker Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "908--919",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE\slash} {ACM} Transactions on Audio, Speech, and
                 Language Processing Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "920--921",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE} Transactions on Audio, Speech, and Language
                 Processing information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "922--923",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Introducing {IEEE Collabratec}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "924",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "C1",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "C2",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "C3",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "4",
  pages =        "C4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Jul 24 18:45:09 MDT 2017",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "925--926",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "927--928",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Manu Airaksinen and Tom B{\"a}ckstr{\"o}m and Paavo
                 Alku",
  title =        "Quadratic Programming Approach to Glottal Inverse
                 Filtering by Joint Norm-1 and Norm-2 Optimization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "929--939",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Ofer Schwartz and Sharon Gannot and Emanu{\"e}l A. P.
                 Habets",
  title =        "Multispeaker {LCMV} Beamformer and Postfilter for
                 Source Separation and Noise Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "940--951",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Dongmei Wang and Chengzhu Yu and John H. L. Hansen",
  title =        "Robust Harmonic Features for Classification-Based
                 Pitch Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "952--964",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Tara N. Sainath and Ron J. Weiss and Kevin W. Wilson
                 and Bo Li and Arun Narayanan and Ehsan Variani and
                 Michiel Bacchiani and Izhak Shafran and Andrew Senior
                 and Kean Chin and Ananya Misra and Chanwoo Kim",
  title =        "Multichannel Signal Processing With Deep Neural
                 Networks for Automatic Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "965--979",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Hanieh Khalilian and Ivan V. Baji{\'c} and Rodney G.
                 Vaughan",
  title =        "A Simulation Study of a Three-Dimensional Sound Field
                 Reproduction System for Immersive Communication",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "980--995",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Andreas Franck and Wenwu Wang and Filippo Maria Fazi",
  title =        "Sparse $ \ell_1$-Optimal Multiloudspeaker Panning and
                 Its Relation to Vector Base Amplitude Panning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "996--1010",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Songbin Li and Yizhen Jia and C.-C. Jay Kuo",
  title =        "Steganalysis of {QIM} Steganography in Low-Bit-Rate
                 Speech Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1011--1022",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Naoyuki Kanda and Xugang Lu and Hisashi Kawai",
  title =        "Maximum-a-Posteriori-Based Decoding for End-to-End
                 Acoustic Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1023--1034",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Navid Shokouhi and John H. L. Hansen",
  title =        "{Teager--Kaiser} Energy Operators for Overlapped
                 Speech Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1035--1047",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Yi-Chin Huang and Chung-Hsien Wu and Yan-You Chen and
                 Ming-Ge Shie and Jhing-Fa Wang",
  title =        "Personalized Spontaneous Speech Synthesis Using a
                 Small-Sized Unsegmented Semispontaneous Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1048--1060",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Jeongsoo Park and Jaeyoung Shin and Kyogu Lee",
  title =        "Exploiting Continuity\slash Discontinuity of Basis
                 Vectors in Spectrogram Decomposition for
                 Harmonic-Percussive Sound Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1061--1074",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Xueliang Zhang and DeLiang Wang",
  title =        "Deep Learning Based Binaural Speech Separation in
                 Reverberant Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1075--1084",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Masood Delfarah and DeLiang Wang",
  title =        "Features for Masking-Based Monaural Speech Separation
                 in Reverberant Conditions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1085--1094",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Feiran Yang and Gerald Enzner and Jun Yang",
  title =        "Statistical Convergence Analysis for Optimal Control
                 of {DFT}-Domain Adaptive Echo Canceler",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1095--1106",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Takashi Nose and Yusuke Arao and Takao Kobayashi and
                 Komei Sugiura and Yoshinori Shiga",
  title =        "Sentence Selection Based on Extended Entropy Using
                 Phonetic and Prosodic Contexts for Statistical
                 Parametric Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1107--1116",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Gergely Firtha and P{\'e}ter Fiala and Frank Schultz
                 and Sascha Spors",
  title =        "Improved Referencing Schemes for {2.5D} Wave Field
                 Synthesis Driving Functions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1117--1127",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Esteban Maestre and Gary P. Scavone and Julius O.
                 Smith",
  title =        "Joint Modeling of Bridge Admittance and Body
                 Radiativity for Efficient Synthesis of String
                 Instrument Sound by Digital Waveguides",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1128--1139",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Gongping Huang and Jacob Benesty and Jingdong Chen",
  title =        "On the Design of Frequency-Invariant Beampatterns With
                 Uniform Circular Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1140--1153",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Zden{\v{e}}k Pr{\r{u}}{\v{s}}a and Peter Balazs and
                 Peter Lempel S{\o}ndergaard",
  title =        "A Noniterative Method for Reconstruction of Phase From
                 {STFT} Magnitude",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1154--1164",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1167--1168",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1169--1170",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1171",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Introducing {IEEE Collabratec}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1172",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{Member Get-A-Member (MGM) Program}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "1173",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank Page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "B1165--B1166",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "C1",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "C2",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "C3",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "5",
  pages =        "C4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1167--1168",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "G. Richard and T. Virtanen and J. P. Bello and N. Ono
                 and H. Glotin",
  title =        "Introduction to the Special Section on Sound Scene and
                 Event Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1169--1171",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "H{\'e}ctor A. S{\'a}nchez-Hevia and David Ayll{\'o}n
                 and Roberto Gil-Pita and Manuel Rosa-Zurera",
  title =        "Maximum Likelihood Decision Fusion for Weapon
                 Classification in Wireless Acoustic Sensor Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1172--1182",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Nithin Rao Koluguri and G. Nisha Meenakshi and
                 Prasanta Kumar Ghosh",
  title =        "Spectrogram Enhancement Using {Multiple Window
                 Savitzky--Golay (MWSG)} Filter for Robust Bird Sound
                 Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1183--1192",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Dan Stowell and Emmanouil Benetos and Lisa F. Gill",
  title =        "On-Bird Sound Recordings: Automatic Acoustic
                 Recognition of Activities and Contexts",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1193--1206",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Brandon T. Carroll and Bradley M. Whitaker and Wayne
                 Dayley and David V. Anderson",
  title =        "Outlier Learning via Augmented Frozen Dictionaries",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1207--1215",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Victor Bisot and Romain Serizel and Slim Essid and
                 Ga{\"e}l Richard",
  title =        "Feature Learning With Matrix Factorization Applied to
                 Acoustic Scene Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1216--1229",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Yong Xu and Qiang Huang and Wenwu Wang and Peter
                 Foster and Siddharth Sigtia and Philip J. B. Jackson
                 and Mark D. Plumbley",
  title =        "Unsupervised Feature Learning Based on Deep Models for
                 Environmental Audio Tagging",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1230--1241",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Ren{\'e} Grzeszick and Axel Plinge and Gernot A.
                 Fink",
  title =        "Bag-of-Features Methods for Acoustic Event Detection
                 and Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1242--1252",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Alain Rakotomamonjy",
  title =        "Supervised Representation Learning for Audio Scene
                 Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1253--1265",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Emmanouil Benetos and Gr{\'e}goire Lafay and Mathieu
                 Lagrange and Mark D. Plumbley",
  title =        "Polyphonic Sound Event Tracking Using Linear Dynamical
                 Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1266--1277",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Huy Phan and Lars Hertel and Marco Maass and Philipp
                 Koch and Radoslaw Mazur and Alfred Mertins",
  title =        "Improved Audio Scene Classification Based on
                 Label-Tree Embeddings and Convolutional Neural
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1278--1290",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Emre {\c{C}}ak{\i}r and Giambattista Parascandolo and
                 Toni Heittola and Heikki Huttunen and Tuomas Virtanen",
  title =        "Convolutional Recurrent Neural Networks for Polyphonic
                 Sound Event Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1291--1303",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Jens Schr{\"o}der and Niko Moritz and J{\"o}rn
                 Anem{\"u}ller and Stefan Goetze and Birger Kollmeier",
  title =        "Classifier Architectures for Acoustic Scenes and
                 Events: Implications for {DNNs}, {TDNNs}, and
                 Perceptual Features from {DCASE} 2016",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1304--1314",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Wenjun Yang and Sridhar Krishnan",
  title =        "Combining Temporal Features by Local Binary Pattern
                 for Acoustic Scene Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1315--1321",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "David Dov and Ronen Talmon and Israel Cohen",
  title =        "Multimodal Kernel Method for Activity Detection of
                 Sound Sources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1322--1334",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Keisuke Imoto and Nobutaka Ono",
  title =        "Spatial Cepstrum as a Spatial Feature Using a
                 Distributed Microphone Array for Acoustic Scene
                 Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1335--1343",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Ivo Trowitzsch and Johannes Mohr and Youssef Kashef
                 and Klaus Obermayer",
  title =        "Robust Detection of Environmental Sounds in Binaural
                 Auditory Scenes",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1344--1356",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Abu Shafin Mohammad Mahdee Jameel and Shaikh Anowarul
                 Fattah and Rajib Goswami and Wei-Ping Zhu and M. Omair
                 Ahmad",
  title =        "Noise Robust Formant Frequency Estimation Method Based
                 on Spectral Model of Repeated Autocorrelation of
                 Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1357--1370",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Na Li and Man-Wai Mak and Jen-Tzung Chien",
  title =        "{DNN}-Driven Mixture of {PLDA} for Robust Speaker
                 Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1371--1383",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Kai Wu and Vaninirappuputhenpurayil Gopalan Reju and
                 Andy W. H. Khong and Shu Ting Goh",
  title =        "Swarm Intelligence Based Particle Filter for
                 Alternating Talker Localization and Tracking Using
                 Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1384--1397",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1398--1399",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1400--1401",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1402",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Introducing {IEEE Collabratec}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1403",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{Member Get-A-Member (MGM) Program}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "1404",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "C1",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "C2",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "C3",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "6",
  pages =        "C4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1405--1406",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1407--1408",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Yu-An Chen and Ju-Chiang Wang and Yi-Hsuan Yang and
                 Homer H. Chen",
  title =        "Component Tying for Mixture Model Adaptation in
                 Personalization of Music Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1409--1420",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Hossein Zeinali and Hossein Sameti and Luk{\'a}{\v{s}}
                 Burget",
  title =        "{HMM}-Based Phrase-Independent $i$-Vector Extractor
                 for Text-Dependent Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1421--1435",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Xinzhou Xu and Jun Deng and Nicholas Cummins and
                 Zixing Zhang and Chen Wu and Li Zhao and Bj{\"o}rn
                 Schuller",
  title =        "A Two-Dimensional Framework of Multiple Kernel
                 Subspace Learning for Recognizing Emotion in Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1436--1449",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Mandy Korpusik and James Glass",
  title =        "Spoken Language Understanding for a Nutrition Dialogue
                 System",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1450--1461",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Mahmoud Fakhry and Piergiorgio Svaizer and Maurizio
                 Omologo",
  title =        "Audio Source Separation in Reverberant Environments
                 Using $ \beta $-Divergence-Based Nonnegative
                 Factorization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1462--1476",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Bracha Laufer-Goldshtein and Ronen Talmon and Sharon
                 Gannot",
  title =        "Semi-Supervised Source Localization on Multiple
                 Manifolds With Distributed Microphones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1477--1491",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Donald S. Williamson and DeLiang Wang",
  title =        "Time-Frequency Masking in the Complex Domain for
                 Speech Dereverberation and Denoising",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1492--1501",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Liang Lu and Steve Renals",
  title =        "Small-Footprint Highway Deep Neural Networks for
                 Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1502--1511",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Ina Kodrasi and Simon Doclo",
  title =        "Signal-Dependent Penalty Functions for Robust Acoustic
                 Multi-Channel Equalization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1512--1525",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Jung-Hee Kim and Jin Kim and Jae Hyeon Jeon and Sang
                 Won Nam",
  title =        "Delayless Individual-Weighting-Factors Sign Subband
                 Adaptive Filter With Band-Dependent Variable
                 Step-Sizes",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1526--1534",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Yannan Wang and Jun Du and Li-Rong Dai and Chin-Hui
                 Lee",
  title =        "A Gender Mixture Detection Approach to Unsupervised
                 Single-Channel Speech Separation Based on Deep Neural
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1535--1546",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Giacomo Vairetti and Enzo {De Sena} and Michael
                 Catrysse and S{\o}ren Holdt Jensen and Marc Moonen and
                 Toon van Waterschoot",
  title =        "A Scalable Algorithm for Physically Motivated and
                 Sparse Approximation of Room Impulse Responses With
                 Orthonormal Basis Functions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1547--1561",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1562--1563",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1564--1565",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1566",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Introducing {IEEE Collabratec}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "1567",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "C1",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "C2",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "C3",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "7",
  pages =        "C4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:30 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1562--1563",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1564--1565",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Francis Stevens and Damian T. Murphy and Lauri Savioja
                 and Vesa V{\"a}lim{\"a}ki",
  title =        "Modeling Sparsely Reflecting Outdoor Acoustic Scenes
                 Using the Waveguide {Web}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1566--1578",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Ferdinando Olivieri and Filippo Maria Fazi and Simone
                 Fontana and Dylan Menzies and Philip Arthur Nelson",
  title =        "Generation of Private Sound With a Circular
                 Loudspeaker Array and the Weighted Pressure Matching
                 Method",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1579--1591",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Samy Elshamy and Nilesh Madhu and Wouter Tirry and Tim
                 Fingscheidt",
  title =        "Instantaneous A Priori {SNR} Estimation by Cepstral
                 Excitation Manipulation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1592--1605",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Paavo Alku and Rahim Saeidi",
  title =        "The Linear Predictive Modeling of Speech From
                 Higher-Lag Autocorrelation Coefficients Applied to
                 Noise-Robust Speaker Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1606--1617",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Cheng Pang and Hong Liu and Jie Zhang and Xiaofei Li",
  title =        "Binaural Sound Localization Based on Reverberation
                 Weighting and Generalized Parametric Mapping",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1618--1632",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Somanath Pradhan and Vinal Patel and Dipen Somani and
                 Nithin V. George",
  title =        "An Improved Proportionate Delayless
                 Multiband-Structured Subband Adaptive Feedback
                 Canceller for Digital Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1633--1643",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Szymon Drgas and Tuomas Virtanen and J{\"o}rg
                 L{\"u}cke and Antti Hurmalainen",
  title =        "Binary Non-Negative Matrix Deconvolution for Audio
                 Dictionary Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1644--1656",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Fatemeh Saki and Nasser Kehtarnavaz",
  title =        "Real-Time Unsupervised Classification of Environmental
                 Noise Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1657--1667",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Lakshmish Kaushik and Abhijeet Sangwan and John H. L.
                 Hansen",
  title =        "Automatic Sentiment Detection in Naturalistic Audio",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1668--1679",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Ofer Schwartz and Sharon Gannot and Emanu{\"e}l A. P.
                 Habets",
  title =        "{Cram{\'e}r--Rao} Bound Analysis of Reverberation
                 Level Estimators for Dereverberation and Noise
                 Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1680--1693",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Seyran Khademi and Richard C. Hendriks and W. Bastiaan
                 Kleijn",
  title =        "Intelligibility Enhancement Based on Mutual
                 Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1694--1708",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Yuta Hatano and Chuang Shi and Yoshinobu Kajikawa",
  title =        "Compensation for Nonlinear Distortion of the Frequency
                 Modulation-Based Parametric Array Loudspeaker",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1709--1717",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Yu-Ren Chien and Daryush D. Mehta and J{\'o}n
                 Gu{\eth}nason and Mat{\'\i}as Za{\~n}artu and Thomas F.
                 Quatieri",
  title =        "Evaluation of Glottal Inverse Filtering Algorithms
                 Using a Physiologically Based Articulatory Speech
                 Synthesizer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1718--1730",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1731--1732",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1733--1734",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1735",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Introducing {IEEE Collabratec}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "1736",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "C1",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "C2",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "C3",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "8",
  pages =        "C4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1737--1738",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1739--1740",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Jakob Abe{\ss}er and Gerald Schuller",
  title =        "Instrument-Centered Music Transcription of Solo Bass
                 Guitar Recordings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1741--1750",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Thomas {Le Cornu} and Ben Milner",
  title =        "Generating Intelligible Audio Speech From Visual
                 Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1751--1761",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Lemao Liu and Atsushi Fujita and Masao Utiyama and
                 Andrew Finch and Eiichiro Sumita",
  title =        "Translation Quality Estimation Using Only Bilingual
                 Corpora",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1762--1772",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Emad M. Grais and Gerard Roma and Andrew J. R. Simpson
                 and Mark D. Plumbley",
  title =        "Two-Stage Single-Channel Audio Source Separation Using
                 Deep Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1773--1783",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Giuliano Bernardi and Toon van Waterschoot and Jan
                 Wouters and Marc Moonen",
  title =        "Adaptive Feedback Cancellation Using a
                 Partitioned-Block Frequency-Domain {Kalman} Filter
                 Approach With {PEM}-Based Signal Prewhitening",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1784--1798",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Vinal Patel and Jordan Cheer and Nithin V. George",
  title =        "Modified Phase-Scheduled-Command {FxLMS} Algorithm for
                 Active Sound Profiling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1799--1808",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Killian Janod and Mohamed Morchid and Richard Dufour
                 and Georges Linar{\`e}s and Renato {De Mori}",
  title =        "Denoised Bottleneck Features From Deep Autoencoders
                 for Telephone Conversation Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1809--1820",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Nikolaos Stefanakis and Despoina Pavlidi and
                 Athanasios Mouchtaris",
  title =        "Perpendicular Cross-Spectra Fusion for Sound Source
                 Localization With a Planar Microphone Array",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1821--1835",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  note =         "See corrections \cite{Stefanakis:2017:CPC}.",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Takenori Yoshimura and Kei Hashimoto and Keiichiro
                 Oura and Yoshihiko Nankaku and Keiichi Tokuda",
  title =        "Simultaneous Optimization of Multiple Tree-Based
                 Factor Analyzed {HMM} for Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1836--1845",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Eita Nakamura and Kazuyoshi Yoshii and Simon Dixon",
  title =        "Note Value Recognition for Piano Transcription Using
                 {Markov} Random Fields",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1846--1858",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1859--1860",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1861--1862",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "1863",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "C1",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "C2",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "C3",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "C4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1859--1860",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1861--1862",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Xiaohai Tian and Siu Wa Lee and Zhizheng Wu and Eng
                 Siong Chng and Haizhou Li",
  title =        "An Exemplar-Based Approach to Frequency Warping for
                 Voice Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1863--1876",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Siying Wang and Sebastian Ewert and Simon Dixon",
  title =        "Identifying Missing and Extra Notes in Piano
                 Recordings Using Score-Informed Dictionary Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1877--1889",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Sandro Cumani and Pietro Laface",
  title =        "Joint Estimation of {PLDA} and Nonlinear
                 Transformations of Speaker Vectors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1890--1900",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Morten Kolb{\ae}k and Dong Yu and Zheng-Hua Tan and
                 Jesper Jensen",
  title =        "Multitalker Speech Separation With Utterance-Level
                 Permutation Invariant Training of Deep Recurrent Neural
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1901--1913",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Cheng-Tao Chung and Cheng-Yu Tsai and Chia-Hsiang Liu
                 and Lin-Shan Lee",
  title =        "Unsupervised Iterative Deep Learning of Speech
                 Features and Acoustic Tokens with Applications to
                 Spoken Term Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1914--1928",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Niccol{\`o} Antonello and Enzo {De Sena} and Marc
                 Moonen and Patrick A. Naylor and Toon van Waterschoot",
  title =        "Room Impulse Response Interpolation Using a Sparse
                 Spatio-Temporal Representation of the Sound Field",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1929--1941",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Yanmin Qian and Nanxin Chen and Heinrich Dinkel and
                 Zhizheng Wu",
  title =        "Deep Feature Engineering for Noise Robust Spoofing
                 Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1942--1955",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Sina Hafezi and Alastair H. Moore and Patrick A.
                 Naylor",
  title =        "Augmented Intensity Vectors for Direction of Arrival
                 Estimation in the Spherical Harmonic Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1956--1968",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Byeongho Jo and Jung-Woo Choi",
  title =        "Spherical Harmonic Smoothing for Localizing Coherent
                 Sound Sources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1969--1984",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Emma Jokinen and Ulpu Remes and Paavo Alku",
  title =        "Intelligibility Enhancement of Telephone Speech Using
                 {Gaussian} Process Regression for Normal-to-Lombard
                 Spectral Tilt Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1985--1996",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Xiaofei Li and Laurent Girin and Radu Horaud and
                 Sharon Gannot",
  title =        "Multiple-Speaker Localization Based on Direct-Path
                 Features and Likelihood Maximization With Spatial
                 Sparsity Regularization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1997--2012",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Marc Arnela and Oriol Guasch",
  title =        "Finite Element Synthesis of Diphthongs Using Tuned
                 Two-Dimensional Vocal Tracts",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "2013--2023",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Deepak Baby and Hugo {Van hamme}",
  title =        "Joint Denoising and Dereverberation Using
                 Exemplar-Based Sparse Representations and Decaying Norm
                 Constraint",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "2024--2035",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "2036--2037",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "2038--2039",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "2040",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "C1",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "C2",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "C3",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "C4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2041--2042",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2043--2044",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Qinghua Huang and Lin Zhang and Yong Fang",
  title =        "Two-Stage Decoupled {DOA} Estimation Based on Real
                 Spherical Harmonics for Spherical Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2045--2058",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Tomoki Hayashi and Shinji Watanabe and Tomoki Toda and
                 Takaaki Hori and Jonathan {Le Roux} and Kazuya Takeda",
  title =        "Duration-Controlled {LSTM} for Polyphonic Sound Event
                 Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2059--2070",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Monisankha Pal and Goutam Saha",
  title =        "Spectral Mapping Using Prior Re-Estimation of
                 $i$-Vectors and System Fusion for Voice Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2071--2084",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Seppo Enarvi and Peter Smit and Sami Virpioja and
                 Mikko Kurimo",
  title =        "Automatic Speech Recognition With Very Large
                 Conversational {Finnish} and {Estonian} Vocabularies",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2085--2097",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Hannah Muckenhirn and Pavel Korshunov and Mathew
                 Magimai-Doss and S{\'e}bastien Marcel",
  title =        "Long-Term Spectral Statistics for Voice Presentation
                 Attack Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2098--2111",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Brian Hamilton and Stefan Bilbao",
  title =        "{FDTD} Methods for {$3$-D} Room Acoustics Simulation
                 With High-Order Accuracy in Space and Time",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2112--2124",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Pejman Mowlaee and Martin Blass and W. Bastiaan
                 Kleijn",
  title =        "New Results in Modulation-Domain Single-Channel Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2125--2137",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Dylan Menzies and Filippo Maria Fazi",
  title =        "Decoding and Compression of Channel and Scene Objects
                 for Spatial Audio",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2138--2151",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Eunwoo Song and Frank K. Soong and Hong-Goo Kang",
  title =        "Effective Spectral and Excitation Modeling Techniques
                 for {LSTM--RNN}-Based Speech Synthesis Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2152--2161",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Pulkit Sharma and Vinayak Abrol and Anil Kumar Sao",
  title =        "Deep-Sparse-Representation-Based Features for Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2162--2175",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Iynkaran Natgunanathan and Yong Xiang and Guang Hua
                 and Gleb Beliakov and John Yearwood",
  title =        "Patchwork-Based Multilayer Audio Watermarking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2176--2187",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Chengzhu Yu and John H. L. Hansen",
  title =        "Active Learning Based Constrained Clustering For
                 Speaker Diarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2188--2198",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Emil Solsb{\ae}k Ottosen and Monika D{\"o}rfler",
  title =        "A Phase Vocoder Based on Nonstationary {Gabor}
                 Frames",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2199--2208",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Boaz Schwartz and Sharon Gannot and Emanu{\"e}l A. P.
                 Habets",
  title =        "Two Model-Based {EM} Algorithms for Blind Source
                 Separation in Noisy Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2209--2222",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Maja Taseska and Emanu{\"e}l A. P. Habets",
  title =        "Nonstationary Noise {PSD} Matrix Estimation for
                 Multichannel Blind Speech Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2223--2236",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Bruno {Di Giorgi} and Simon Dixon and Massimiliano
                 Zanoni and Augusto Sarti",
  title =        "A Data-Driven Model of Tonal Chord Sequence
                 Complexity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2237--2250",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "N. Stefanakis and D. Pavlidi and A. Mouchtaris",
  title =        "Corrections to {``Perpendicular Cross-Spectra Fusion
                 for Sound Source Localization With a Planar Microphone
                 Array'' [Sep 17 1821--1835]}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2251",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  note =         "See \cite{Stefanakis:2017:PCS}.",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2252--2253",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2254--2255",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2256",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "C1",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "C2",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "C3",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "C4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2252--2253",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "T. Schultz and T. Hueber and D. J. Krusienski and J.
                 S. Brumberg",
  title =        "Introduction to the Special Issue on Biosignal-Based
                 Spoken Communication",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2254--2256",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Tanja Schultz and Michael Wand and Thomas Hueber and
                 Dean J. Krusienski and Christian Herff and Jonathan S.
                 Brumberg",
  title =        "Biosignal-Based Spoken Communication: a Survey",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2257--2271",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Christopher Dromey and Katherine M. Black",
  title =        "Effects of Laryngeal Activity on Articulation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2272--2280",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Michal Borsky and Daryush D. Mehta and Jarrad H. {Van
                 Stan} and Jon Gudnason",
  title =        "Modal and Nonmodal Voice Quality Classification Using
                 Acoustic and Electroglottographic Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2281--2291",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Alborz Rezazadeh Sereshkeh and Robert Trott and
                 Aur{\'e}lien Bricout and Tom Chau",
  title =        "{EEG} Classification of Covert Speech Using
                 Regularized Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2292--2300",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Reza Sahraeian and Dirk {Van Compernolle}",
  title =        "Crosslingual and Multilingual Speech Recognition Based
                 on the Speech Manifold",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2301--2312",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "{\Dbar}or{\dbar}e T. Grozdi{\'c} and Slobodan T.
                 Jovi{\v{c}}i{\'c}",
  title =        "Whispered Speech Recognition Using Deep Denoising
                 Autoencoder and Inverse Filtering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2313--2322",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Myungjong Kim and Beiming Cao and Ted Mau and Jun
                 Wang",
  title =        "Speaker-Independent Silent Speech Recognition From
                 Flesh-Point Articulatory Movements Using an {LSTM}
                 Neural Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2323--2336",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Patrick Lumban Tobing and Kazuhiro Kobayashi and
                 Tomoki Toda",
  title =        "Articulatory Controllable Speech Modification Based on
                 Statistical Inversion and Production Mappings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2337--2350",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Ingmar Steiner and S{\'e}bastien {Le Maguer} and
                 Alexander Hewer",
  title =        "Synthesis of Tongue Motion and Acoustics From Text
                 Using a Multimodal Articulatory Database",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2351--2361",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Jose A. Gonzalez and Lam A. Cheah and Angel M. Gomez
                 and Phil D. Green and James M. Gilbert and Stephen R.
                 Ell and Roger K. Moore and Ed Holdsworth",
  title =        "Direct Speech Reconstruction From Articulatory Sensor
                 Data by Machine Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2362--2374",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Matthias Janke and Lorenz Diener",
  title =        "{EMG}-to-Speech: Direct Generation of Speech From
                 Facial Electromyographic Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2375--2385",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Geoffrey S. Meltzner and James T. Heaton and Yunbin
                 Deng and Gianluca {De Luca} and Serge H. Roy and Joshua
                 C. Kline",
  title =        "Silent Speech Recognition as an Alternative
                 Communication Device for Persons With Laryngectomy",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2386--2398",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Fei Chen and Lan Wang and Hui Chen and Gang Peng",
  title =        "Investigations on {Mandarin} Aspiratory Animations
                 Using an Airflow Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2399--2409",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Wayne Xiong and Jasha Droppo and Xuedong Huang and
                 Frank Seide and Michael L. Seltzer and Andreas Stolcke
                 and Dong Yu and Geoffrey Zweig",
  title =        "Toward Human Parity in Conversational Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2410--2423",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Biao Zhang and Deyi Xiong and Jinsong Su and Hong
                 Duan",
  title =        "A Context-Aware Recurrent Encoder for Neural Machine
                 Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2424--2432",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Afsaneh Asaei and Milos Cernak and Herv{\'e}
                 Bourlard",
  title =        "Perceptual Information Loss due to Impaired Speech
                 Production",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2433--2443",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Ning Ma and Tobias May and Guy J. Brown",
  title =        "Exploiting Deep Neural Networks and Head Movements for
                 Robust Binaural Localization of Multiple Sources in
                 Reverberant Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2444--2453",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "List of Reviewers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2454--2457",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2458--2459",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2460--2461",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2462",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "2017 Subject Index {{\booktitle{IEEE Transactions on
                 Applied Superconductivity}}} Vol. 27",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2463--2488",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "C1",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "C2",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "C3",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "C4",
  month =        "????",
  year =         "2017",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "1--2",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents {[Edics]}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "3--4",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Dianna Yee and Homayoun Kamkar-Parsi and Rainer Martin
                 and Henning Puder",
  title =        "A Noise Reduction Postfilter for Binaurally Linked
                 Single-Microphone Hearing Aids Utilizing a Nearby
                 External Microphone",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "5--18",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Tom B{\"a}ckstr{\o}m and Johannes Fischer",
  title =        "Fast Randomization for Distributed Low-Bitrate Coding
                 of Speech and Audio",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "19--30",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Jun Deng and Xinzhou Xu and Zixing Zhang and Sascha
                 Fr{\"u}hholz and Bj{\"o}rn Schuller",
  title =        "Semisupervised Autoencoders for Speech Emotion
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "31--43",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Md. Sahidullah and Dennis Alexander Lehmann Thomsen
                 and Rosa Gonzalez Hautam{\"a}ki and Tomi Kinnunen and
                 Zheng-Hua Tan and Robert Parts and Martti
                 Pitk{\"a}nen",
  title =        "Robust Voice Liveness Detection and Speaker
                 Verification Using Throat Microphones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "44--56",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Gilles Degottex and Pierre Lanchantin and Mark Gales",
  title =        "A Log Domain Pulse Model for Parametric Speech
                 Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "57--70",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Johannes Abel and Tim Fingscheidt",
  title =        "Artificial Speech Bandwidth Extension Using Deep
                 Neural Networks for Wideband Spectral Envelope
                 Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "71--83",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Yuki Saito and Shinnosuke Takamichi and Hiroshi
                 Saruwatari",
  title =        "Statistical Parametric Speech Synthesis Incorporating
                 Generative Adversarial Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "84--96",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Kristian Timm Andersen and Marc Moonen",
  title =        "Robust Speech-Distortion Weighted Interframe {Wiener}
                 Filters for Single-Channel Noise Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "97--107",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Chen-Yu Chiang",
  title =        "Cross-Dialect Adaptation Framework for Constructing
                 Prosodic Models for {Chinese} Dialect Text-to-Speech
                 Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "108--121",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Bingquan Liu and Zhen Xu and Chengjie Sun and Baoxun
                 Wang and Xiaolong Wang and Derek F. Wong and Min
                 Zhang",
  title =        "Content-Oriented User Modeling for Personalized
                 Response Ranking in Chatbots",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "122--133",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Zhiyuan Tang and Dong Wang and Yixiang Chen and
                 Lantian Li and Andrew Abel",
  title =        "Phonetic Temporal Neural Model for Language
                 Identification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "134--144",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Soumitro Chakrabarty and Emanu{\"e}l A. P. Habets",
  title =        "A {Bayesian} Approach to Informed Spatial Filtering
                 With Robustness Against {DOA} Estimation Errors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "145--160",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Kuan-Yu Chen and Shih-Hung Liu and Berlin Chen and
                 Hsin-Min Wang",
  title =        "An Information Distillation Framework for Extractive
                 Summarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "161--170",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Ma Jin and Yan Song and Ian McLoughlin and Li-Rong
                 Dai",
  title =        "{LID}-Senones and Their Statistics for Language
                 Identification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "171--183",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Zhehuai Chen and Jasha Droppo and Jinyu Li and Wayne
                 Xiong",
  title =        "Progressive Joint Modeling in Unsupervised
                 Single-Channel Overlapped Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "184--196",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Shivesh Ranjan and John H. L. Hansen",
  title =        "Curriculum Learning Based Approaches for Noise Robust
                 Speaker Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "1",
  pages =        "197--210",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Yoshiaki Bando and Katsutoshi Itoyama and Masashi
                 Konyo and Satoshi Tadokoro and Kazuhiro Nakadai and
                 Kazuyoshi Yoshii and Tatsuya Kawahara and Hiroshi G.
                 Okuno",
  title =        "Speech Enhancement Based on {Bayesian} Low-Rank and
                 Sparse Decomposition of Multichannel Magnitude
                 Spectrograms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "215--230",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Yu-Ping Ruan and Qian Chen and Zhen-Hua Ling",
  title =        "A Sequential Neural Encoder With Latent Structured
                 Description for Modeling Sentences",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "231--242",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Amelia J. Gully and Helena Daffern and Damian T.
                 Murphy",
  title =        "Diphthong Synthesis Using the Dynamic {$3$D} Digital
                 Waveguide Mesh",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "243--255",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Chunyang Wu and Mark J. F. Gales and Anton Ragni and
                 Penny Karanasou and Khe Chai Sim",
  title =        "Improving Interpretability and Regularization in Deep
                 Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "256--265",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Kehai Chen and Tiejun Zhao and Muyun Yang and Lemao
                 Liu and Akihiro Tamura and Rui Wang and Masao Utiyama
                 and Eiichiro Sumita",
  title =        "A Neural Approach to Source Dependence Based Context
                 Model for Statistical Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "266--280",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Joonas Nikunen and Aleksandr Diment and Tuomas
                 Virtanen",
  title =        "Separation of Moving Sound Sources Using Multichannel
                 {NMF} and Acoustic Tracking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "281--295",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Johan Sw{\"a}rd and Hongbin Li and Andreas Jakobsson",
  title =        "Off-Grid Fundamental Frequency Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "296--303",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Dylan Menzies and Marcos F. Sim{\'o}n G{\'a}lvez and
                 Filippo Maria Fazi",
  title =        "A Low-Frequency Panning Method With Compensation for
                 Head Rotation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "304--317",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Branimir Dropulji{\'c} and Igor Miji{\'c} and Davor
                 Petrinovi{\'c} and Tanja Jovanovic and Kre{\v{s}}imir
                 {\'C}osi{\'c}",
  title =        "Vocal Analysis of Acoustic Startle Responses",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "318--329",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Philipp Aichinger and Martin Hagm{\"u}ller and Berit
                 Schneider-Stickler and Jean Schoentgen and Franz
                 Pernkopf",
  title =        "Tracking of Multiple Fundamental Frequencies in
                 Diplophonic Voices",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "330--341",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anastasios Alexandridis and Athanasios Mouchtaris",
  title =        "Multiple Sound Source Location Estimation in Wireless
                 Acoustic Sensor Networks Using {DOA} Estimates: The
                 Data-Association Problem",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "342--356",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Robert Rehr and Timo Gerkmann",
  title =        "On the Importance of Super-{Gaussian} Speech Priors
                 for Machine-Learning Based Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "357--366",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Sonia Djaziri-Larbi and Ga{\"e}l Mah{\'e} and Imen
                 Mezghani and Monia Turki and M{\'e}riem Ja{\"\i}dane",
  title =        "Watermark-Driven Acoustic Echo Cancellation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "367--378",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Annamaria Mesaros and Toni Heittola and Emmanouil
                 Benetos and Peter Foster and Mathieu Lagrange and
                 Tuomas Virtanen and Mark D. Plumbley",
  title =        "Detection and Classification of Acoustic Scenes and
                 Events: Outcome of the {DCASE 2016 Challenge}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "379--393",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Cheng-Tao Chung and Lin-Shan Lee",
  title =        "Unsupervised Discovery of Structured Acoustic Tokens
                 With Applications to Spoken Term Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "394--405",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Tobias May",
  title =        "Robust Speech Dereverberation With a Neural
                 Network-Based Post-Filter That Exploits
                 Multi-Conditional Training of Binaural Cues",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "406--414",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Majid Mirbagheri and Les Atlas and Adrian K. C. Lee",
  title =        "Regression Factor Analysis With an Application to
                 Continuous {HRIR} Measurement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "415--421",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Jen-Tzung Chien",
  title =        "{Bayesian} Nonparametric Learning for Hierarchical and
                 Sparse Topics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "422--435",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Johannes Stahl and Pejman Mowlaee",
  title =        "A Pitch-Synchronous Simultaneous Detection-Estimation
                 Framework for Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "2",
  pages =        "436--450",
  month =        "????",
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:33 MST 2018",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "C1--C1",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "C2--C2",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "457--458",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents [Edics]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "459--460",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "C. D. Salvador and S. Sakamoto and J. Trevi{\~n}o and
                 Y. Suzuki",
  title =        "Boundary Matching Filters for Spherical Microphone and
                 Loudspeaker Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "461--474",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic field; Acoustics; Array signal processing;
                 array signal processing; Boundary conditions; boundary
                 matching filters; Fourier transforms; Helmholtz
                 equations; high-definition spatial audio;
                 high-resolution arrays; integral equations; KHIE;
                 Kirchhoff Helmholtz integral equation;
                 Kirchhoff-Helmholtz integral equation; loudspeaker
                 array signals; loudspeaker arrays; Loudspeakers;
                 loudspeakers; matched filters; microphone array
                 signals; Microphone arrays; microphone arrays; open
                 reproduction boundary; physical boundary conditions;
                 rigid recording boundary; sound field reconstruction;
                 sound field recording; sound field reproduction; sound
                 fields; Spatial audio; spatial discretization effects;
                 spatial effects; spectral effects; spherical array;
                 spherical array signal conversion; spherical Fourier
                 transform; spherical harmonic functions; spherical
                 microphone; temporal effects; transform domain;
                 transform-domain signal conversion filters",

  author =       "A. H. Abdelaziz",
  title =        "Comparing Fusion Models for {DNN}-Based Audiovisual
                 Continuous Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "475--484",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Acoustics; audio-visual systems; audiovisual automatic
                 speech recognition; audiovisual automatic speech
                 recognition (AV-ASR) benchmarks; audiovisual continuous
                 speech recognition; audiovisual fusion; audiovisual
                 fusion models; Audiovisual speech recognition;
                 automatic lipreading; clean-train-clean-test;
                 clean-train-noisy-test; coupled HMM; decision fusion
                 model; feature fusion model; hidden Markov models;
                 Hidden Markov models; Markov model; multistream hidden
                 Markov model (HMM); neural nets; Noise measurement;
                 noisy acoustic signals; novel LVCSR AV-ASR models;
                 phone recognition; Speech; speech recognition; Speech
                 recognition; turbo decoders; Visualization; vocabulary
                 continuous speech recognition models",

  author =       "S. Emura",
  title =        "Residual Echo Reduction for Multichannel Acoustic Echo
                 Cancelers With a Complex-Valued Residual Echo
                 Estimate",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "485--500",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal processing; Acoustics; AEC; bias
                 model; Coherence; coherence estimation; complex-valued
                 residual echo estimate; conventional residual echo
                 reduction methods; echo reduction; echo suppression;
                 echo-path change; far-end signals; far-end talker
                 change; frequency responses; Frequency-domain analysis;
                 Loudspeakers; Microphones; Multichannel acoustic echo
                 canceler; multichannel acoustic echo cancelers;
                 residual echo; Speech; speech processing; Speech
                 processing; Wiener filters",

  author =       "V. H. Do and N. F. Chen and B. P. Lim and M. A.
                 Hasegawa-Johnson",
  title =        "Multitask Learning for Phone Recognition of
                 Underresourced Languages Using Mismatched
                 Transcription",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "501--514",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic modeling; acoustic signal processing;
                 Acoustics; Adaptation models; annotation language; Data
                 models; Gaussian Mixture Model; Gaussian processes;
                 hidden Markov models; Hidden Markov models;
                 Hidden-Markov Model; learning (artificial
                 intelligence); matched target-language graphemes;
                 mismatched annotation-language graphemes; mismatched
                 transcription; multi-task learning; multitask learning
                 framework; natural language processing; neural nets;
                 Phone recognition; Probabilistic logic; probabilistic
                 transcription; Speech; speech audio; speech processing;
                 speech recognition; Speech recognition; under-resourced
                 languages; underresourced language",

  author =       "M. Zohourian and G. Enzner and R. Martin",
  title =        "Binaural Speaker Localization Integrated Into an
                 Adaptive Beamformer for Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "515--528",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "adaptive binaural beamformer; array signal processing;
                 Array signal processing; Azimuth; beamforming;
                 beamforming techniques; binaural hearing aids; binaural
                 localization; Binaural source localization; binaural
                 speaker localization; Cost function;
                 Direction-of-arrival estimation; direction-of-arrival
                 estimation; Estimation; feature extraction; hearing
                 aids; hearing-aids; interference suppression;
                 localization algorithms; maximum likelihood estimation;
                 Microphones; source separation; speaker recognition;
                 Speech; speech enhancement",

  author =       "Y. Xiang and I. Natgunanathan and D. Peng and G. Hua
                 and B. Liu",
  title =        "Spread Spectrum Audio Watermarking Using Multiple
                 Orthogonal {PN} Sequences and Variable Embedding
                 Strengths and Polarities",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "529--539",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "audio coding; audio data; audio signal; audio signal
                 processing; Audio watermarking; audio watermarking;
                 compression attacks; copyright; Copyright protection;
                 copyright protection; Discrete cosine transforms;
                 Electronic mail; embedding capacity; existing audio
                 watermarking methods; high robustness; Interference;
                 Multiple Orthogonal PN Sequences; noise addition;
                 Robustness; Speech; spread spectrum; spread spectrum
                 audio watermarking; SS-based audio watermarking method;
                 Variable Embedding Strengths; watermark bits;
                 watermarking",

  author =       "C. Tan and F. Wei and Q. Zhou and N. Yang and B. Du
                 and W. Lv and M. Zhou",
  title =        "Context-Aware Answer Sentence Selection With
                 Hierarchical Gated Recurrent Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "540--549",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Analytical models; answer sentence selection;
                 artificial intelligence; candidate sentence;
                 comprehension style answer sentence selection; context
                 independent matching; context information; Context
                 modeling; context-aware answer sentence selection;
                 hierarchical gated recurrent neural networks;
                 hierarchical neural networks; Logic gates; natural
                 language processing; Question answering; question
                 answering (information retrieval); recurrent neural
                 nets; Recurrent neural networks; Semantics; sentence
                 level recurrent neural network; SQuAD datasets; WikiQA
                 datasets; word level recurrent neural network",

  author =       "J. Zhang and S. P. Chepuri and R. C. Hendriks and R.
                 Heusdens",
  title =        "Microphone Subset Selection for {MVDR} Beamformer
                 Based Noise Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "550--563",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "array signal processing; candidate sensors;
                 computational complexity; convex optimization; convex
                 optimization techniques; convex programming;
                 correlation matrices; correlation methods; data-driven
                 approach; dynamic scenarios; Estimation; greedy
                 algorithm; greedy algorithms; greedy strategy;
                 informative sensors; matrix algebra; microphone subset
                 selection; Microphones; minimum variance distortionless
                 response beamformer based noise reduction; model-driven
                 scheme; MVDR; MVDR beamformer; Noise reduction; noise
                 reduction; output noise power; radius-based beamformer;
                 sensor measurements; Sensor selection; sensor selection
                 problem; Sensors; Signal to noise ratio;
                 signal-to-noise ratio; sparse MVDR; sparsity; Speech;
                 Speech processing; statistical analysis; statistical
                 information; transmission power; WASN; wireless
                 acoustic sensor networks; wireless sensor networks",

  author =       "S. Wang and P. Lin and Y. Tsao and J. Hung and B. Su",
  title =        "Suppression by Selecting Wavelets for Feature
                 Compression in Distributed Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "564--579",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "back-end server; client terminal; compressed features;
                 compression rate; compression stage; data compression;
                 data processing; data transmission efficiency; device
                 requirements; Discrete wavelet transform; discrete
                 wavelet transform; discrete wavelet transforms;
                 Discrete wavelet transforms; distributed speech
                 recognition; down-sampling process; DSR; DWT; feature
                 compression; feature compression algorithm; feature
                 extraction; Feature extraction; feature extraction;
                 feature sequence temporal properties; Frequency
                 modulation; high frequency counterpart; incoming speech
                 feature sequence; incoming stream; low frequency
                 subsequence; low-frequency subsequence; Mandarin
                 Chinese news corpus; memory minimization; mobile
                 device; network server; noise-robustness techniques;
                 oversmoothing effects; recognition performance;
                 recognition tasks; remote network; Servers; specific
                 feature statistics normalization; Speech; Speech
                 recognition; speech recognition; SSW; SSW approach;
                 standard robustness task; statistics; statistics
                 normalization; suppression by selecting wavelets;
                 temporal subsequences; wireless channel; wireless
                 channels",

  author =       "Y. Wang and M. Brookes",
  title =        "Model-Based Speech Enhancement in the Modulation
                 Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "580--594",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "competitive algorithms; complex domain; Cost function;
                 estimated dynamics; Gaussring-model; Kalman filter;
                 Kalman filters; least mean squares methods; minimum
                 mean-square error (MMSE) estimator; MMSE estimation;
                 Modulation; modulation-domain Kalman filter;
                 modulation-domain speech enhancement; noise amplitudes;
                 Noise measurement; segmental SNR measure; short-time
                 objective intelligibility measure; spectral amplitudes;
                 Speech; speech amplitudes; Speech enhancement; speech
                 enhancement; Speech enhancement; speech
                 intelligibility; speech quality measure; speech
                 recognition experiments; statistical Gaussring model;
                 statistical modelling",

  author =       "C. Huemmer and C. Hofmann and R. Maas and W.
                 Kellermann",
  title =        "Estimating Parameters of Nonlinear Systems Using the
                 Elitist Particle Filter Based on Evolutionary
                 Strategies",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "595--608",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic distortion; approximated continuous posterior
                 distribution; Atmospheric measurements; Bayes methods;
                 classical particle filtering; elitist particle filter;
                 elitist particles; EPFES; Estimation; evolutionary
                 computation; evolutionary elitist-particle selection
                 scheme; evolutionary strategies; FIR filters; Gaussian
                 particle filter; instantaneously calculated particle
                 weights; latent state vector; linear FIR filter;
                 long-term information; loudspeakers; Loudspeakers;
                 nonlinear acoustic echo path; nonlinear acoustics;
                 nonlinear parameter estimation; nonlinear system;
                 Nonlinear systems; parameter estimation; particle
                 filter; particle filtering (numerical methods);
                 Particle measurements; Probability density function;
                 published elitist-particle selection process;
                 single-channel nonlinear acoustic echo cancellation;
                 State-space model; statistical distributions;
                 time-variant latent state; univariate nonstationary
                 growth model",

  author =       "D. Salvati and C. Drioli and G. L. Foresti",
  title =        "A Low-Complexity Robust Beamforming Using Diagonal
                 Unloading for Acoustic Source Localization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "609--622",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic analysis; acoustic array processing; acoustic
                 arrays; acoustic signal processing; acoustic source
                 localization; Acoustics; array output vector; Array
                 signal processing; array signal processing; broadband
                 robust beamforming; Complexity theory; computational
                 complexity; Covariance matrices; covariance matrices;
                 data-dependent covariance matrix conditioning method;
                 Diagonal unloading beamforming; diagonal unloading
                 transformation method; direction of arrival estimation;
                 DU beamformer localization performance; DU beamformer
                 method; DU beamforming; eigenvalues and eigenfunctions;
                 filtering theory; low-complexity robust beamforming;
                 microphone array; Multiple signal classification;
                 multiple signal classification method; noisy signal
                 space; opportune diagonal matrix; radiating sound
                 source; real acoustic data; response power beamforming;
                 robust localization; robust minimum variance
                 distortionless response filter; Robustness; Sensors;
                 signal classification; signal subspace",

  author =       "J. Su and J. Zeng and D. Xiong and Y. Liu and M. Wang
                 and J. Xie",
  title =        "A Hierarchy-to-Sequence Attentional Neural Machine
                 Translation Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "623--632",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "attention models; Chinese-English translation; clause
                 level; Context modeling; conventional NMT model;
                 Decoding; English-German translation; grammars;
                 hierarchical neural network structure;
                 Hierarchy-to-sequence; hierarchy-to-sequence
                 attentional neural machine translation model;
                 hierarchy-to-sequence attentional NMT model; language
                 translation; learning (artificial intelligence); long
                 parallel sentences; natural language processing; neural
                 machine translation; neural nets; optimal model
                 parameters; parameter learning; recurrent neural nets;
                 Recurrent neural networks; recurrent neural networks;
                 segmented clause sequence; segmented clauses; semantic
                 compositionality modeling; Semantics;
                 sequence-to-sequence attentional neural machine
                 translation; short clauses; Speech; Speech processing;
                 text analysis; Training; translation prediction",

  author =       "W. B. Kheder and D. Matrouf and M. Ajili and J.
                 Bonastre",
  title =        "A Unified Joint Model to Deal With Nuisance
                 Variabilities in the $i$-Vector Space",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "633--645",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic corruptions; acoustic nuisances; acoustic
                 signal processing; Acoustics; Additive noise; additive
                 noise; baseline system performance; Computational
                 modeling; corrupted test i-vector; data-driven nuisance
                 compensation technique; i-vector; i-vector space;
                 i-vectors framework; joint modeling; least mean squares
                 methods; nuisance variabilities; Robustness; short
                 utterance; speaker recognition; speaker recognition
                 technology; Speaker verification; Speech; Speech
                 processing; SR systems; Training; unified joint model",

  author =       "G. Gelly and J. Gauvain",
  title =        "Optimization of {RNN}-Based Speech Activity
                 Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "646--656",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Artificial neural networks; automatic speech
                 recognition systems; back-end parameters; CG-LSTM
                 model; coordinated-gate LSTM network; downstream speech
                 recognizer; Error analysis; feature extraction; frame
                 error rate; long short-term memory; NIST 2015 SAD
                 evaluation data; NIST detection cost function;
                 nondifferentiable optimization problems; Optimization;
                 particle swarm optimisation; particle swarm
                 optimization; recurrent neural nets; recurrent neural
                 network; Recurrent neural networks; recurrent neural
                 networks; RNN models; SAD optimization; short-term
                 memory network; Smoothing methods; Speech; Speech
                 activity detection; speech activity detection; speech
                 recognition; word error rate",

  author =       "M. Taseska and E. A. P. Habets",
  title =        "Blind Source Separation of Moving Sources Using
                 Sparsity-Based Source Detection and Tracking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "657--670",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic source tracking; approximate Bayesian
                 tracker; Bayes methods; blind source separation; blind
                 source separation algorithms; BSS filters; estimated
                 statistics; independent vector analysis-based BSS
                 algorithms; measurement-to-source association
                 probabilities; microphone arrays; Microphone arrays;
                 Narrowband; noise reduction capabilities; optimal
                 spatial filters; pattern clustering; Position
                 measurement; probability; PSD matrix estimation; short
                 time-frequency domain; source separation; source
                 signals; Spatial filtering; spatial filters; spatially
                 separated microphone arrays; Speech; Speech processing;
                 TF bin associations; time-frequency bin",

  author =       "L. Yu and J. Wang and K. R. Lai and X. Zhang",
  title =        "Refining Word Embeddings Using Intensity Scores for
                 Sentiment Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "671--681",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Context modeling; dissimilar intensity scores;
                 fine-grained sentiment classification; labeled corpora;
                 low-dimensional vector representations; natural
                 language processing tasks; Neural networks; opposite
                 sentiment polarity; pretrained word embeddings;
                 pretrained word vectors; refinement process; Semantics;
                 Sentiment analysis; sentiment analysis; Sentiment
                 analysis; sentiment embeddings; sentiment intensity
                 scores; sentiment lexicons; sentimentally dissimilar
                 words; Speech; Speech processing; sufficient sentiment
                 information; word embeddings; word vector refinement;
                 word vector refinement model; Word2vec",

  author =       "Y. Dorfan and A. Plinge and G. Hazan and S. Gannot",
  title =        "Distributed Expectation-Maximization Algorithm for
                 Speaker Localization in Reverberant Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "682--695",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Acoustic measurements; acoustic radiators; acoustic
                 source localization; active speakers; auditory scene
                 analysis; complex-valued Gaussian mixture model;
                 Direction-of-arrival estimation; distributed
                 algorithms; distributed expectation-maximization;
                 Estimation; expectation-maximisation algorithm; extreme
                 conditions; filter the measurements; Gaussian
                 processes; hearing; high localization accuracy; human
                 hearing mechanisms; incremental
                 expectation-maximization; Microphones; mixture models;
                 modified incremental distributed
                 expectation-maximization algorithm; multi-path;
                 multipath conditions; multiple subbands; onset
                 dominance; original IDEM framework; phase difference
                 measurements; Precedence effect; real-valued truncated
                 Gaussian mixture; reverberant environments;
                 reverberation; Reverberation; sound source
                 localization; speaker localization; spectral masking;
                 Speech; speech processing; Speech processing; time
                 difference of arrival; time difference of arrival
                 measurements; time-of-arrival estimation; truncated
                 Gaussian",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "696--697",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "698--699",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "700--700",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Introducing {IEEE Collabratec}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "701--701",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "C3--C3",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "3",
  pages =        "C4--C4",
  month =        mar,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "C1--C1",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "C2--C2",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "696--697",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents [Edics]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "698--699",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Z. Tan and M. Mak and B. K. Mak",
  title =        "{DNN}-Based Score Calibration With Multitask Learning
                 for Noise Robust Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "700--712",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "calibration; Calibration; calibration algorithms;
                 conventional calibration methods; conventional
                 score-shift approach; Deep learning; deep neural
                 network; DNN approach; DNN-based score calibration;
                 i-vector pairs; i-vector speaker verification systems;
                 learning (artificial intelligence); multi-task
                 learning; multitask DNNs; multitask learning; neural
                 nets; Noise measurement; noise robust speaker
                 verification; noise robustness; Noise robustness; noise
                 robustness; score calibration; Signal to noise ratio;
                 speaker ID; speaker recognition; speaker verification;
                 Speech; Training; uncalibrated scores",

  author =       "Y. Hu and Z. Ling",
  title =        "Extracting Spectral Features Using Deep Autoencoders
                 With Binary Distributed Hidden Units for Statistical
                 Parametric Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "713--724",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic modeling; Acoustics; BDAE training method;
                 belief networks; binary distributed hidden units; DAE;
                 Decoding; Deep auto-encoder; deep autoencoders; deep
                 belief network; Feature extraction; feature extraction;
                 feedforward deep neural networks; feedforward neural
                 nets; Hidden Markov models; model training; Neural
                 networks; parameter generation; raw features; spectral
                 envelopes; spectral feature extraction method; Speech;
                 speech synthesis; SPSS systems; statistical parametric
                 speech synthesis; Training",

  author =       "B. Laufer-Goldshtein and R. Talmon and S. Gannot",
  title =        "A Hybrid Approach for Speaker Tracking Based on {TDOA}
                 and Data-Driven Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "725--735",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic channel variation; Acoustic measurements;
                 acoustic signal processing; Acoustics; associated
                 source position; associated TDOA readings; data
                 modalities; data-driven propagation model; distributed
                 microphone pairs; extended Kalman filter; extended
                 Kalman filter (EKF); Gaussian process; Gaussian
                 processes; high-dimensional acoustic feature
                 representation; Kalman filters; learning-based
                 approach; low-dimensional time difference of arrival
                 estimation; Manifolds; Microphones; microphones; noisy
                 enclosures; nonlinear filters; observation model;
                 observation models; relative transfer function (RTF);
                 reverberant acoustic channels; reverberant enclosures;
                 reverberation; signal representation; Speaker tracking;
                 speaker tracking schemes; Speech; speech processing;
                 Speech processing; state-space representation;
                 statistical analysis; statistical model; TDOA
                 estimation; time difference of arrival (TDOA);
                 time-of-arrival estimation; Training",

  author =       "S. Cumani and P. Laface",
  title =        "Speaker Recognition Using e-Vectors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "736--748",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "accurate speaker subspace; Adaptation models; e-vector
                 subspace; e-vectors; e-vectors systems; eigenvoice;
                 Estimation; i vectors; i-vector systems; i-vector
                 training; informative speaker subspace; intersession
                 subspaces; JFA; joint factor analysis; low-dimensional
                 subspace; speaker factors; speaker modeling approach;
                 speaker recognition; Speaker recognition; speaker
                 recognition evaluations; Speech; Speech processing;
                 speech segment; Standards; text-independent speaker
                 recognition; total variability i-vector subspace;
                 Training; training segment; vectors",

  author =       "L. Xu and K. A. Lee and H. Li and Z. Yang",
  title =        "Generalizing {I}-Vector Estimation for Rapid Speaker
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "749--759",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Baum-Welch statistics; compact representation;
                 Computational modeling; Covariance matrices; covariance
                 matrices; Estimation; factor representation; Gaussian
                 processes; i-vector estimation; i-vector Gaussian
                 formulation; Load modeling; Loading; NIST SRE 10;
                 posterior covariance matrix; rapid computation; SOP
                 approach; speaker recognition; Speaker verification;
                 Speech; spoken utterance; Standards;
                 subspace-orthogonalizing prior; text-independent
                 speaker recognition; total variability model; vectors",

  author =       "Y. Buchris and I. Cohen and J. Benesty",
  title =        "Frequency-Domain Design of Asymmetric Circular
                 Differential Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "760--773",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "array signal processing; asymmetric beampatterns;
                 asymmetric circular differential microphone arrays;
                 broadband beamforming; Circular differential microphone
                 arrays; Frequency-domain analysis; frequency-domain
                 analysis; frequency-domain design; Geometry;
                 hypercardioid; microphone arrays; Microphone arrays;
                 Multiaccess communication; Sensor arrays;
                 supercardioid; superdirective beamformers",

  author =       "J. Zhang and T. D. Abhayapala and W. Zhang and P. N.
                 Samarasinghe and S. Jiang",
  title =        "Active Noise Control Over Space: a Wave Domain
                 Approach",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "774--786",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic potential energy reduction level; acoustic
                 signal processing; active noise control; Active noise
                 control (ANC); Adaptive algorithms; control region;
                 fundamental problem; Harmonic analysis; loudspeaker
                 weights; Loudspeakers; loudspeakers; Microphone arrays;
                 minimisation; minimization problems; multichannel;
                 Noise cancellation; noise cancellation performance;
                 noise reduction level; Potential energy; primary noise
                 field; reverberant room; secondary source driving
                 signals; signal denoising; spatial noise; wave domain;
                 wave domain approach; wave-domain active noise control
                 algorithms; wave-domain adaptive algorithms;
                 wave-domain residual signal coefficients; wave-domain
                 secondary source coefficients",

  author =       "Y. Luo and Z. Chen and N. Mesgarani",
  title =        "Speaker-Independent Speech Separation With Deep
                 Attractor Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "787--796",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "attractor network; corresponding attractor point; deep
                 attractor network; deep clustering; deep learning
                 framework; deep learning methods; high-dimensional
                 embedding space; learning (artificial intelligence);
                 Machine learning; masker speakers; multi-talker; neural
                 nets; Neural networks; output dimension problem;
                 reference point; signal reconstruction; signal
                 representation; Source separation; source separation;
                 speaker mixtures; speaker-independent speech
                 separation; Spectrogram; Speech; Speech processing;
                 speech processing; speech recognition; standard signal
                 reconstruction; Time-frequency analysis; time-frequency
                 assignment; time-frequency embeddings; time-frequency

  author =       "N. M. Joy and S. R. Kothinti and S. Umesh",
  title =        "{FMLLR} Speaker Normalization With {i-Vector}: In
                 Pseudo-{FMLLR} and Distillation Framework",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "797--805",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic modeling; acoustic signal processing;
                 Acoustics; ASR task; augmenting i-vectors; automatic
                 speech recognition system; decoding; deep neural
                 networks; distillation; DNN acoustic model training;
                 Feature extraction; feature-space maximum likelihood
                 linear regression; FMLLR speaker normalization;
                 generalized distillation framework; Hidden Markov
                 models; i-vector; i-vector appended filterbank
                 features; maximum likelihood estimation; neural nets;
                 pseudo-FMLLR; pseudoFMLLR features; real-time scenario;
                 regression analysis; single utterance; Speaker
                 normalization; speaker normalizing methods; speaker
                 recognition; speaker-specific FMLLR; Speech; Speech
                 processing; Switchboard; time-synchronous pair;
                 Training; Transforms; un-supervised; unsupervised
                 speaker normalization techniques",

  author =       "S. Chandna and W. Wang",
  title =        "Bootstrap Averaging for Model-Based Source Separation
                 in Reverberant Conditions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "806--819",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Analytical models; audio signal processing; bootstrap
                 averaging; expectation maximization (EM) algorithm;
                 expectation maximization estimates;
                 expectation-maximisation algorithm; frequency domain
                 Gaussian mixture model; frequency-dependent GMM
                 parameter estimates; frequency-domain analysis;
                 Gaussian mixture model (GMM); Gaussian processes;
                 mixture models; model-based source separation;
                 parameter estimation; reverberant conditions;
                 reverberant speech mixtures; Reverberation;
                 reverberation; source separation; Source separation;
                 spectral histogram; Speech; Speech processing; speech
                 processing; statistical analysis; T-F masks;
                 time-frequency (T-F) masking; Time-frequency analysis;
                 time-frequency masks",

  author =       "Z. Tan and M. Mak and B. K. Mak and Y. Zhu",
  title =        "Denoised {Senone} {I}-Vectors for Robust Speaker
                 Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "820--830",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal processing; backpropagation;
                 backpropagation fine-tuning; belief networks; deep
                 architecture; deep belief network; deep learning;
                 denoised senone i-vectors; denoising autoencoder;
                 denoising autoencoders; feature extraction; Feature
                 extraction; i-vector extraction process; i-vectors;
                 neural nets; Noise measurement; Noise reduction; noise
                 robustness; noisy environments; phonetically
                 discriminative acoustic features; phonetically
                 discriminative features; Robustness; senone deep neural
                 networks; senone posterior estimation; senone
                 posteriors; signal denoising; speaker recognition;
                 Speaker recognition; Speaker Verification; Speaker
                 verification; Speech; Training",

  author =       "K. Itakura and Y. Bando and E. Nakamura and K. Itoyama
                 and K. Yoshii and T. Kawahara",
  title =        "{Bayesian} Multichannel Audio Source Separation Based
                 on Integrated Source and Spatial Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "831--846",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "audio signal processing; basis spectra weighted sum;
                 Bayes methods; Bayesian models; Bayesian multichannel
                 audio source separation; blind source separation;
                 Computational modeling; Covariance matrices;
                 factor-factor models; factor-mixture models; Gibbs
                 sampling algorithms; hierarchical Bayesian models;
                 Indexes; integrated source; latent Dirichlet
                 allocation; latent source spectrograms; matrix
                 decomposition; microphone array; microphone arrays;
                 Mixture models; mixture-factor models; mixture-mixture
                 models; Multichannel source separation; nonnegative
                 matrix factorization; observed mixture spectrograms;
                 source model; Source separation; source separation;
                 source-spatial combinations; spatial factor model;
                 spatial mixture model; spatial model; Spectrogram;
                 statistical analysis; TF bin; time-frequency bin;
                 unified models; unified source",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "847--848",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "849--850",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "851--851",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Introducing {IEEE Collabratec}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "852--852",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "C3--C3",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "4",
  pages =        "C4--C4",
  month =        apr,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "853--854",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents [Edics]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "855--856",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Y. E. Baba and A. Walther and E. A. P. Habets",
  title =        "{$3$D} Room Geometry Inference Based on Room Impulse
                 Response Stacks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "857--872",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "3D room geometry inference; acoustic signal
                 processing; acoustic wave reflection; architectural
                 acoustics; direction-of-arrival estimation; echo
                 labeling; Geometry; geometry; image microphones; Image
                 model; Labeling; loudspeaker array geometry;
                 loudspeakers; Loudspeakers; loudspeakers; Microphone
                 arrays; microphones; real image microphone positions;
                 reflection point localization; reflection points;
                 reflective boundaries; reflector localization; room
                 geometry inference; room impulse response stacks;
                 single microphone; Three-dimensional displays; TOA
                 disambiguation; transient response; Two dimensional
                 displays",

  author =       "Q. Zhang and J. H. L. Hansen",
  title =        "Language\slash Dialect Recognition Based on
                 Unsupervised Deep Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "873--882",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Acoustics; additional transcribed speech information;
                 adversarial autoencoder; Arabic dialect corpus;
                 bottleneck feature; dialect recognition; estimated
                 phonetic labels; feature extraction; Feature
                 extraction; generative modeling autoencoder; Hidden
                 Markov models; i-Vector framework; Language/Dialect
                 recognition; latent variable learning algorithms;
                 natural language processing; phonetic label estimation;
                 Speech; speech coding; speech feature processing;
                 speech processing; Speech processing; speech
                 recognition; Speech recognition; state-of-the-art
                 language/dialect; Training; unsupervised bottleneck
                 feature extraction approach; unsupervised deep learning
                 methods; unsupervised learning; variational
                 autoencoder",

  author =       "Z. Ling and Y. Ai and Y. Gu and L. Dai",
  title =        "Waveform Modeling and Generation Using Hierarchical
                 Recurrent Neural Networks for Speech Bandwidth
                 Extension",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "883--894",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "bottleneck features; BWE method models; conventional
                 BWE methods; deep neural network; dilated convolutional
                 neural network; dilated convolutional neural networks;
                 feedforward neural nets; generated wideband speech;
                 generation method; Hidden Markov models; hierarchical
                 recurrent neural networks; hierarchical structure;
                 high-frequency waveform sample; HRNN model; input
                 narrowband waveform samples; LSTM layers; Narrowband;
                 narrowband speech; plain sample-level recurrent neural
                 network based method; reconstructed wideband speech;
                 recurrent neural nets; Recurrent neural networks;
                 recurrent neural networks; short-term memory layers;
                 Speech; Speech bandwidth extension; speech bandwidth
                 extension; speech coding; Speech processing; speech
                 quality; speech synthesis; unconditional neural audio
                 generator; vocoders; waveform modeling methods;
                 Wideband; wideband frequency waveform sample; wideband
                 speech waveforms",

  author =       "M. Delcroix and K. Kinoshita and A. Ogawa and C.
                 Huemmer and T. Nakatani",
  title =        "Context Adaptive Neural Network Based Acoustic Models
                 for Rapid Adaptation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "895--908",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic context class; acoustic context information;
                 acoustic model; acoustic model adaptation; Acoustic
                 modeling; Acoustics; Adaptation models; adaptive
                 training; auxiliary feature; auxiliary network; CHiME3
                 data; context adaptive neural network; context class
                 weights; convolutional neural network; deep neural
                 network; environmental adaptation; feedforward neural
                 nets; Hidden Markov models; learning (artificial
                 intelligence); network input; Neural networks; rapid
                 adaptation; speaker adaptation experiments; Speech;
                 speech recognition; speech recognition performance;
                 Training; Training data",

  author =       "L. T. T. Tran and S. E. Nordholm and H. Schepker and
                 H. H. Dam and S. Doclo",
  title =        "Two-Microphone Hearing Aids Using Prediction Error
                 Method for Adaptive Feedback Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "909--923",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "adaptive control; Adaptive feedback control; adaptive
                 filter estimates; adaptive filters; added stable gain;
                 AFC applications; AFC2; AFC2 method; Correlation;
                 feedback; Feedback control; feedback path; feedback
                 path estimation; handicapped aids; Hearing aids;
                 hearing aids; loudspeaker signal; loudspeakers;
                 Loudspeakers; microphone signals; Microphones;
                 microphones; misalignment; optimal filters; PEM-AFC;
                 PEM-AFC2; prediction error method; prefilter; relative
                 transfer function; single-microphone single-loudspeaker
                 systems; SMSL systems; Speech; Speech processing;
                 speech processing; speech shaped noise; tracking rate;
                 transfer functions; two-microphone adaptive feedback
                 control method; two-microphone hearing aids;
                 two-microphone single-loudspeaker hearing aid",

  author =       "J. Chang and M. Marschall",
  title =        "Periphony-Lattice Mixed-Order Ambisonic Scheme for
                 Spherical Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "924--936",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic field; acoustic signal processing; array
                 signal processing; Array signal processing; Finite
                 wordlength effects; Harmonic analysis; higher order
                 ambisonics; Higher order ambisonics (HOA); HOA;
                 horizontal performance; horizontal sound waves;
                 horizontally incident sound waves; incident direction;
                 Microphone arrays; microphone arrays; mixed-order
                 ambisonics (MOA); MOA scheme; periphony-lattice
                 mixed-order ambisonic scheme; signal reconstruction;
                 sound field reconstruction; sound field reconstruction
                 performance; Speech; Speech processing; spherical array
                 layouts; spherical array of microphones; spherical
                 beamforming; spherical harmonics coefficients;
                 spherical harmonics expansion; spherical microphone
                 arrays; theoretical truncation error",

  author =       "N. Dionelis and M. Brookes",
  title =        "Phase-Aware Single-Channel Speech Enhancement With
                 Modulation-Domain {Kalman} Filtering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "937--950",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Correlation; enhanced speech phase spectrum; filtering
                 theory; Fourier transforms; intelligibility metrics;
                 Kalman filter prediction step; Kalman filter update
                 step models; Kalman filters; modulation-domain Kalman
                 filtering; Noise measurement; noise spectral
                 log-amplitudes; nonlinear relations; phase-aware
                 single-channel speech enhancement; phase-sensitive
                 enhancement algorithm; Prediction algorithms; signal
                 reconstruction; Spectral analysis; Speech; Speech
                 enhancement; speech enhancement; Speech enhancement;
                 speech enhancement algorithm; speech log-spectrum;
                 speech phase; speech phase posterior; speech quality",

  author =       "C. Zheng and A. Deleforge and X. Li and W.
                 Kellermann",
  title =        "Statistical Analysis of the Multichannel {Wiener}
                 Filter Using a Bivariate Normal Distribution for Sample
                 Covariance Matrices",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "951--966",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "bivariate normal distribution; Bivariate normal
                 distribution; Correlation; covariance matrices;
                 Covariance matrices; Gaussian distribution; intrinsic
                 correlation coefficient; mean square error methods;
                 minimum variance distortionless response beamformer;
                 multichannel Wiener filter; MWF performance; Noise
                 measurement; noise reduction; Noise reduction; noise
                 sample covariance matrices; normal distribution;
                 probability; probability density function; sample
                 covariance matrix; Sensors; signal sampling;
                 signal-to-noise-ratio; Speech; statistical analysis;
                 Wiener filters",

  author =       "C. Vaz and V. Ramanarayanan and S. Narayanan",
  title =        "Acoustic Denoising Using Dictionary Learning With
                 Spectral and Temporal Regularization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "967--980",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic denoising; Algorithm design and analysis;
                 CMF-WISA cost function; complex NMF; complex
                 nonnegative matrix factorization; dictionary learning;
                 Magnetic resonance imaging; magnetic resonance imaging
                 scans; matrix decomposition; Noise measurement; noise
                 modeling; Noise reduction; noise suppression; noisy
                 spectrum; Real-time MRI; signal denoising; Spatial
                 resolution; Speech; speech enhancement; speech+noise
                 portions; Three-dimensional displays",

  author =       "L. Wang and A. Cavallaro",
  title =        "Pseudo-Determined Blind Source Separation for Ad-hoc
                 Microphone Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "981--994",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal processing; ad hoc networks; Ad hoc
                 networks; Ad-hoc; ad-hoc microphone networks;
                 asynchronous recording; blind source separation; Blind
                 source separation; blind source separation; filtering
                 theory; Frequency-domain analysis; ICA; incrementally
                 source separation; independent component analysis;
                 late-reverberation suppression; microphone arrays;
                 Microphones; nontarget channels; over-determined
                 mixture; overdetermined M $\times$ N mixture; power
                 spectral density; pseudodetermined blind source
                 separation; pseudodetermined mixture model;
                 reference-based permutation alignment scheme;
                 Reverberation; reverberation; sampling rate; signal
                 sampling; sound sources; spectral postfilter; Speech;
                 target channel; time offsets; wireless channels",

  author =       "S. Cumani and P. Laface",
  title =        "Scoring Heterogeneous Speaker Vectors Using Nonlinear
                 Transformations and Tied {PLDA} Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "995--1009",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "class-dependent nonlinear transformation; e-vector;
                 Estimation; Feature extraction; i-vector; NIST;
                 NL-Tied-PLDA; non-linear density transformations;
                 nonlinear tied-PLDA; PLDA; probabilistic linear
                 discriminant analysis; probability; score heterogeneous
                 i-vectors; scoring heterogeneous speaker vectors;
                 speaker recognition; Speaker recognition; Speech;
                 Speech processing; Speech recognition; test i-vectors;
                 text-independent speaker recognition systems; Tied PLDA
                 models; vectors",

  author =       "G. Bernardi and T. {van Waterschoot} and J. Wouters
                 and M. Moonen",
  title =        "Subjective and Objective Sound-Quality Evaluation of
                 Adaptive Feedback Cancellation Algorithms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "1010--1024",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic feedback; acoustic feedback control;
                 Acoustics; Adaptive feedback cancellation (AFC);
                 adaptive feedback cancellation algorithms; adaptive
                 filters; AFC; application-specific objective measures;
                 audio signal processing algorithms; block normalized
                 least mean square algorithm; feedback; frequency-domain
                 adaptive filter; frequency-domain adaptive filter
                 (FDAF); frequency-domain analysis; Frequency-domain
                 analysis; frequency-domain Kalman filter; Kalman
                 filter; Kalman filters; least mean squares methods;
                 Loudspeakers; music signals; objective sound-quality
                 evaluation; PEM-FDKF; perceptual sound-quality
                 evaluation; Prediction algorithms; prediction-error
                 method; prediction-error method (PEM); Signal
                 processing algorithms; Speech; Speech processing;
                 speech processing; speech signals; statistical
                 analysis; subjective sound-quality evaluation;
                 subjective-evaluation measures",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "1025--1026",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "1027--1028",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "C1--C1",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "C2--C2",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "C3--C3",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "5",
  pages =        "C4--C4",
  month =        may,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "C1--C1",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "C2--C2",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1025--1026",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents [Edics]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1027--1028",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "H. Kameoka and T. Higuchi and M. Tanaka and L. Li",
  title =        "Nonnegative Matrix Factorization With Basis Clustering
                 Using Cepstral Distance Regularization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1029--1040",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal processing; audio signal processing;
                 audio source separation; Audio source separation; basis
                 clustering; blind source separation; cepstral analysis;
                 cepstral distance regularization; Clustering
                 algorithms; joint optimization approach; Linear
                 programming; magnitude spectrogram; majorization
                 minimization algorithm; matrix decomposition; Mel
                 frequency cepstral coefficient; mel-frequency cepstral
                 coefficient (MFCC); mel-frequency cepstral coefficient
                 domain; MFCC domain; music; musical instruments; NMF
                 approach; nonnegative matrix factorization; nonnegative
                 matrix factorization (NMF); optimisation; Optimization;
                 polyphonic signal; Source separation; Spectrogram; time
                 frame; time-varying amplitudes; underlying audio
                 events; unsupervised instrument-wise source

  author =       "J. Donley and C. Ritz and W. B. Kleijn",
  title =        "Multizone Soundfield Reproduction With Privacy- and
                 Quality-Based Speech Masking Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1041--1055",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic contrast; Acoustics; confidential privacy;
                 equal masking influence; frequency domain speech masker
                 filter designs; Frequency-domain analysis; hearing;
                 intelligibility; long term average speech spectra;
                 Loudspeakers; loudspeakers; low-pass filters; multizone
                 soundfield algorithms; Multizone soundfield
                 reproduction; multizone soundfield reproduction;
                 privacy; Privacy; quality; Silicon carbide; sound
                 reproduction; soundfield reproduction geometry; spatial
                 masking filters; speech; Speech; speech
                 intelligibility; speech intelligibility contrast;
                 speech masking filters; speech privacy; speech
                 processing; Speech processing; speech quality mean
                 opinion scores; target speech multizone reproduction",

  author =       "S. Braun and A. Kuklasi{\'n}ski and O. Schwartz and O.
                 Thiergart and E. A. P. Habets and S. Gannot and S.
                 Doclo and J. Jensen",
  title =        "Evaluation and Comparison of Late Reverberation Power
                 Spectral Density Estimators",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1056--1071",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "array processing; Dereverberation; diffuse sound;
                 Electronic mail; late reverberation power spectral
                 density estimators; late reverberation PSD estimators;
                 Maximum likelihood estimation; Microphones;
                 multichannel Wiener filter; power spectral density
                 estimation; Reverberation; reverberation; reverberation
                 reduction; Spatial coherence; spatio-spectral filters;
                 spectral analysis; Speech; speech enhancement; Speech
                 processing; Wiener filters",

  author =       "E. L. Benaroya and N. Obin and M. Liuni and A. Roebel
                 and W. Raumel and S. Argentieri",
  title =        "Binaural Localization of Multiple Sound Sources by
                 Non-Negative Tensor Factorization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1072--1082",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "audio signal processing; binaural head; binaural
                 localization; Binaural localization; binaural sound
                 source localization; blind source separation;
                 computational audio scene analysis; Ear; Image
                 analysis; matrix decomposition; multichannel audio
                 signals; multiple sound sources; non-negative tensor
                 factorization; nonnegative factorization; nonnegative
                 tensor factorization; robot audition; Robot kinematics;
                 sound source position; Speech; Speech processing;
                 Tensile stress; tensors",

  author =       "N. Perraudin and N. Holighaus and P. Majdak and P.
                 Balazs",
  title =        "Inpainting of Long Audio Segments With Similarity
                 Graphs",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1083--1094",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Audio imputation; audio inpainting; audio restoration;
                 audio signal processing; audio signals; audio
                 similarity graphs; candidate segment; concealment;
                 concealment of data loss; distorted signal region;
                 Distortion; extensive listening tests; graph theory;
                 intuitive optimization scheme; long audio segments
                 inpainting; long duration data loss compensation; lost
                 content; lost signal region; Multiple signal
                 classification; Music; music; music recovery;
                 optimisation; real-world music signals; Redundancy;
                 signal defects; signal structure; similarity graphs;
                 Speech; Time-frequency analysis; time-persistent
                 spectral similarity",

  author =       "P. Magron and R. Badeau and B. David",
  title =        "Model-Based {STFT} Phase Recovery for Audio Source
                 Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1095--1105",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Approximation algorithms; audio signal processing;
                 audio source separation; auxiliary function method;
                 complex-valued STFT; Fourier transforms; Frequency
                 estimation; Harmonic analysis; iterative source
                 separation procedure; Phase recovery; phase unwrapping;
                 short-time Fourier transform; sinusoidal modeling;
                 source separation; Source separation; Speech; Speech
                 processing; STFT phase increment; STFT phase recovery;
                 time-domain analysis; time-domain signals;
                 Time-frequency analysis; Wiener filters; Wiener-like

  author =       "I. Kodrasi and S. Doclo",
  title =        "Analysis of Eigenvalue Decomposition-Based Late
                 Reverberation Power Spectral Density Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1106--1118",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "computational complexity; Dereverberation; eigenvalue
                 decomposition; eigenvalues and eigenfunctions;
                 Estimation error; estimation errors; EVD; EVD-based PSD
                 estimator; filtering theory; late reverberation power
                 spectral density estimation; late reverberation PSD
                 estimator; maximum likelihood based PSD estimator;
                 maximum likelihood estimation; Microphones; ML; ML
                 based PSD estimator; modeling errors; multichannel
                 methods; multichannel Wiener filter; Noise measurement;
                 prewhitening; PSD estimate; PSD estimation; relative
                 transfer functions; reverberant speech PSD matrix;
                 reverberation; Reverberation; Spatial coherence;
                 spatial coherence matrix; spectral analysis; Speech;
                 speech dereverberation techniques; speech processing;
                 transfer functions; Wiener filters",

  author =       "S. Braun and E. A. P. Habets",
  title =        "Linear Prediction-Based Online Dereverberation and
                 Noise Reduction Using Alternating {Kalman} Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1119--1129",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal processing; alternating Kalman
                 filters; alternating minimization; autoregressive
                 model; autoregressive processes; causality problem;
                 Dereverberation; Estimation; Fourier transforms; Kalman
                 filter; Kalman filters; MAR coefficients; Microphones;
                 multichannel autoregressive coefficients; multichannel
                 linear prediction; Noise reduction; noise-free
                 reverberant signals; online dereverberation; online
                 processing; optimal noise reduction; Reverberation;
                 reverberation; reverberation reduction; sequential
                 enhancement structures; short-time Fourier transform;
                 signal model; Speech; speech enhancement; Speech
                 processing; STFT domain; time-variant acoustic
                 scenarios; transient response",

  author =       "D. Ram and A. Asaei and H. Bourlard",
  title =        "Sparse Subspace Modeling for Query by Example Spoken
                 Term Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1130--1143",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "AMI database; deep neural network; Dictionaries;
                 dynamic programming; dynamic programming framework;
                 feature extraction; Feature extraction; low-dimensional
                 subspaces; MediaEval database; Mel frequency cepstral
                 coefficient; Neural networks; phone posterior features;
                 posterior probabilities; QbE-STD systems; query by
                 example; query by example spoken term detection; query
                 examples; query processing; query subspace; sparse
                 coding; sparse model recovery; sparse reconstruction
                 errors; sparse recovery modeling; sparse
                 representation; sparse structure; sparse subspace
                 modeling; Speech; Speech processing; speech processing;
                 spoken query; spoken term detection; standard template
                 matching; subspace detection; subspace regularization;
                 Task analysis; template matching likelihood; template
                 matching techniques; temporal structure; zero-resource

  author =       "M. Krawczyk-Becker and T. Gerkmann",
  title =        "On Speech Enhancement Under {PSD} Uncertainty",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1144--1153",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "available speech PSD estimates; Bayes methods;
                 Bayesian clean speech estimators; derived statistical
                 framework; Malah's amplitude estimators; Maximum
                 likelihood estimation; modern PSD estimators; musical
                 noise; Noise measurement; Noise reduction; novel
                 nonlinear clean speech estimator; power spectral
                 densities; power spectral density; PSD estimation
                 errors; PSD uncertainty; robust speech enhancement
                 performance; spectral analysis; Speech; Speech
                 enhancement; speech enhancement; speech estimation
                 errors; statistical analysis; typical speech PSDs;
                 Uncertainty; uncertainty; well-known conventional clean
                 speech estimators",

  author =       "S. Leglaive and R. Badeau and G. Richard",
  title =        "{Student}'s $t$-Source and Mixing Models for
                 Multichannel Audio Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1154--1168",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "audio signal processing; Audio source separation;
                 Bayes methods; Bayesian framework; blind source
                 separation; convolution; convolutive mixing process;
                 filtering theory; matrix decomposition; mixing filters;
                 multichannel audio source separation; multichannel
                 reverberant mixtures; Music; musical signals;
                 non-negative matrix factorization; nonnegative matrix
                 factorization model; Probabilistic logic; Random
                 variables; simple characteristic structure; simple
                 probabilistic priors; source separation; Source
                 separation; specific structure; statistical
                 distributions; statistical room acoustics; student t
                 distribution; student t source and mixing models;
                 Student's t distribution; Time-domain analysis;
                 Time-frequency analysis; time-frequency analysis;
                 time-frequency domain; transient response;
                 under-determined audio source separation; variational

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1169--1170",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "1171--1172",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "C3--C3",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "6",
  pages =        "C4--C4",
  month =        jun,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "C1--C1",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "C2--C2",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1173--1174",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents [Edics]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1175--1176",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "T. Yoshimura and K. Hashimoto and K. Oura and Y.
                 Nankaku and K. Tokuda",
  title =        "Mel-Cepstrum-Based Quantization Noise Shaping Applied
                 to Neural-Network-Based Speech Waveform Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1177--1184",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "approximation theory; cepstral analysis; Feature
                 extraction; filtering theory; human auditory
                 perception; mel-cepstral coefficients; mel-cepstrum;
                 mel-cepstrum-based quantization noise shaping method;
                 mel-log spectrum approximation filter; neural nets;
                 neural-network-based speech waveform synthesis system;
                 noise shaping; Noise shaping; quantisation (signal);
                 quantization; Quantization (signal); Speech; Speech
                 processing; speech quality; speech synthesis; Speech
                 waveform synthesis; synthetic speech; Vocoders;
                 WaveNet; WaveNet generative model; white noise; White
                 noise; white noise",

  author =       "Q. Wang and J. Du and L. Dai and C. Lee",
  title =        "A Multiobjective Learning and Ensembling Approach to
                 High-Performance Speech Enhancement With Compact Neural
                 Network Architectures",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1185--1197",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "7-frame input expansion; cepstral analysis; clean
                 GFCC; clean LPS; clean MFCC; clean speech feature;
                 compact and low-latency design; compact DNNs; compact
                 neural network architectures; deep neural network
                 (DNN); deep neural network architecture; dynamic noise
                 feature; ensembling approach; estimated clean features;
                 feature extraction; Gaussian processes; hidden Markov
                 models; high-performance speech enhancement; IRM;
                 learned features; learning (artificial intelligence);
                 log-power spectra; low-latency design; Mel frequency
                 cepstral coefficient; MOE-DNN; MOL-DNN; MOLE approach;
                 multiobjective ensembling; multiobjective ensembling
                 DNN; multiobjective learning; multiobjective learning
                 DNN; multiobjective set; multiple features; neural net
                 architecture; Neural networks; Noise measurement;
                 regression analysis; SE system; Speech; Speech
                 enhancement; speech enhancement; Speech enhancement
                 (SE); weak models; weak regression functions",

  author =       "M. {\'A}. Del-Agua and A. Gim{\'e}nez and A. Sanchis
                 and J. Civera and A. Juan",
  title =        "Speaker-Adapted Confidence Measures for {ASR} Using
                 Deep Bidirectional Recurrent Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1198--1206",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Adaptation models; ASR; automatic speech recognition;
                 Automatic speech recognition; Computer architecture;
                 confidence estimation; confidence measures; DBLSTM;
                 DBRNN; deep bidirectional recurrent neural networks;
                 English LibriSpeech; long short-term memory; long
                 short-term memory cells; natural language processing;
                 nonadapted confidence measures; recurrent neural nets;
                 Recurrent neural networks; recurrent neural
                 networks-based confidence classifiers; RNN; Spanish
                 PoliMedia tasks; speaker adaptation; speaker-adapted
                 confidence measures; Speech; speech corpus; Speech
                 processing; speech recognition; Task analysis; TED-LIUM
                 corpus; Training; unsupervised adaptation method",

  author =       "J. Proen{\c{c}}a and C. Lopes and M. Tjalve and A.
                 Stolcke and S. Candeias and F. Perdig{\~a}o",
  title =        "Mispronunciation Detection in Children's Reading of
                 Sentences",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1207--1219",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "automatic assessment; automatic reading annotation;
                 automatic reading tutors; automatic segmentation;
                 candidate segmentation; candidate word pronunciations;
                 children sentence reading; children's reading; correct
                 pronunciation; Decoding; Electronic mail; feature
                 extraction; Grammar; Hidden Markov models;
                 log-likelihood ratio; manual segmentation; Measurement;
                 mispronunciation classification; mispronunciation
                 detection; natural language processing; phoneme
                 recognition approaches; segmentation stage; Speech;
                 Speech analysis; spotting approach; Task analysis; word
                 candidates; word pronunciation; word spotting model",

  author =       "Ljubi{\v{s}}a Stankovi{\'c} and Milo{\v{s}}
                 Brajovi{\'c}",
  title =        "Analysis of the Reconstruction of Sparse Signals in
                 the {DCT} Domain Applied to Audio Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1220--1235",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "approximately sparse signals; audio signal processing;
                 Audio signals; compressed sensing; compressive sensing
                 methods; computationally efficient reconstruction
                 algorithm; DCT coefficients; DCT domain; digital signal
                 processing; discrete cosine transform; discrete cosine
                 transforms; Discrete cosine transforms; Discrete
                 Fourier transforms; disturbance scenarios; experimental
                 signals; mean square error methods; mean-square
                 reconstruction error; nonsparse noisy signals; recorded
                 audio signals; reduced set; signal reconstruction;
                 signal representation; signal samples; signal sampling;
                 sparse audio signal processing; sparse signal
                 processing; Speech; Speech processing; statistical
                 properties; synthetic signals; unique reconstruction

  author =       "J. F. Santos and T. H. Falk",
  title =        "Speech Dereverberation With Context-Aware Recurrent
                 Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1236--1246",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "architectural acoustics; context information; Context
                 modeling; context-aware recurrent neural networks;
                 Convolution; convolutional codes; convolutional
                 encoder; deep learning; Dereverberation; Feature
                 extraction; feature extraction; high reverberation
                 times; long-term dependencies; long-term information;
                 perceived reverberation; perceptual evaluation;
                 perceptual objective listening quality assessment;
                 recurrent neural nets; recurrent neural network;
                 recurrent neural networks; reverberant counterpart;
                 reverberant speech; Reverberation; reverberation;
                 reverberation time; short-time objective
                 intelligibility; simulated room impulse responses;
                 spectral magnitude; Speech; speech coding; speech
                 dereverberation; speech enhancement; Speech
                 enhancement; speech intelligibility; speech quality;
                 Time-frequency analysis",

  author =       "M. Geronazzo and S. Spagnol and F. Avanzini",
  title =        "Do We Need Individual Head-Related Transfer Functions
                 for Vertical Localization? The Case Study of a Spectral
                 Notch Distance Metric",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1247--1260",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Acoustics; anthropometry; audio signal processing;
                 auditory elevation perception; auditory model; auditory
                 models; Computational modeling; Databases; dummy-head
                 HRTF; head-related transfer function rendering process;
                 head-related transfer functions (HRTFs); hearing; HRTF
                 selection; HRTF spectra; image processing; individual
                 head-related transfer functions; individualized HRTFs;
                 nonindividual HRTF set; personalized HRTF set;
                 Psychoacoustic models; psychoacoustically motivated
                 anthropometry based mismatch function; random HRTF
                 selection; rendering (computer graphics); Spatial
                 audio; spectral notch distance; spectral notch metric;
                 Speech; Speech processing; transfer functions; Transfer
                 functions; vertical localization",

  author =       "D. Marquardt and S. Doclo",
  title =        "Interaural Coherence Preservation for Binaural Noise
                 Reduction Using Partial Noise Estimation and Spectral
                 Postfiltering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1261--1274",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "array signal processing; Auditory system; beamforming;
                 binaural cues; binaural multichannel Wiener filter;
                 binaural MVDR beamformer; binaural MWF; binaural noise
                 reduction; binaural speech enhancement algorithms;
                 closed-form expression; Coherence; computational
                 complexity; diffuse noise scenarios; Distortion;
                 estimation theory; hearing aids; Integrated circuits;
                 interaural coherence; interaural coherence
                 preservation; Microphones;
                 minimum-variance-distortionless response; Multi-channel
                 Wiener filter; MVDR-IC; MVDR-N; MWF-IC; MWF-N; noise
                 reduction; Noise reduction; noise reduction
                 performance; partial noise estimation;
                 quasidistortionless version; signal denoising; single
                 desired speech source; spectral postfilter; Speech;
                 speech enhancement; undesired noise component; Wiener
                 filters",

  author =       "M. Farmani and M. S. Pedersen and Z. Tan and J.
                 Jensen",
  title =        "Bias-Compensated Informed Sound Source Localization
                 Using Relative Transfer Functions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1275--1289",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; ambient noise
                 characteristics; bias-compensated informed sound source
                 localization; binaural configurations; binaural
                 microphone array configurations; computational
                 complexity; Databases; direction of arrival estimation;
                 direction-of-arrival estimation; Direction-of-arrival
                 estimation; DoA estimator; DoA-dependent relative
                 transfer functions; HA microphones; hearing aid;
                 hearing aid system; hearing aids; Hearing aids;
                 information fusion strategy; lower computational
                 complexity; maximum likelihood; Maximum likelihood
                 estimation; maximum likelihood estimation;
                 maximum-likelihood approach; microphone arrays;
                 microphone signals; Microphones; monaural microphone
                 array configurations; noise-free target speech;
                 received signals; relative transfer function;
                 reverberation; sensor fusion; shadowing effect; Sound
                 source localization; Speech; target sound direction;
                 transfer functions; Wireless communication; wireless
                 microphone informs the HA system",

  author =       "F. Tao and C. Busso",
  title =        "Gating Neural Network for Large Vocabulary Audiovisual
                 Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1290--1302",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "audio-visual systems; audiovisual automatic speech
                 recognition; audiovisual CRSS-4ENGLISH-14 corpus;
                 Audiovisual large vocabulary automatic speech
                 recognition; audiovisual perception process; AV-ASR;
                 complementary information; deep learning solution;
                 Feature extraction; gating layer; gating neural
                 network; Gaussian processes; hidden Markov models;
                 Hidden Markov models; human interactions; hybrid
                 system; learning (artificial intelligence); Machine
                 learning; Multimodal deep learning; multistream HMM
                 system; neural nets; Noise measurement; noisy
                 conditions; noisy features; observation models;
                 real-world applications; Speech; speech recognition;
                 Speech recognition; speech recognition; uninformative
                 visual features; visual cues; Visualization;
                 vocabulary; vocabulary audiovisual speech recognition",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1303--1304",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "1305--1306",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "C3--C3",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "7",
  pages =        "C4--C4",
  month =        jul,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "C1--C1",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "C2--C2",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1303--1304",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents [Edics]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1305--1306",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Z. Rafii and A. Liutkus and F. St{\"o}ter and S. I.
                 Mimilakis and D. FitzGerald and B. Pardo",
  title =        "An Overview of Lead and Accompaniment Separation in
                 Music",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1307--1335",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "accompaniment; accompaniment separation; audio signal
                 processing; automatic karaoke; data-centered
                 approaches; deep learning; Lead; lead; lead component;
                 lead separation systems; lead signal; learning
                 (artificial intelligence); model-based methods; music;
                 Music; music separation; musical structures;
                 musicology; overview; particular complexity; particular
                 difficulty; popular music; popular topic; relevant
                 prior knowledge; remixing; Source separation; source
                 separation; source separation yields; Spectrogram;
                 Speech; Speech processing; Time-frequency analysis",

  author =       "C. Wang and J. Wang and A. Santoso and C. Chiang and
                 C. Wu",
  title =        "Sound Event Recognition Using Auditory-Receptive-Field
                 Binary Pattern and Hierarchical-Diving Deep Belief
                 Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1336--1351",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "audio signal processing; audio-visual descriptor;
                 Auditory receptive fields binary patterns;
                 auditory-receptive-field binary pattern; automatic
                 sound event recognition; belief networks; cepstral
                 analysis; cepstral features; classification method;
                 Data mining; deep neural network system; environmental
                 sound; feature extraction; Feature extraction; Hidden
                 Markov models; hierarchical diving deep belief network;
                 hierarchical-diving deep belief network; human auditory
                 receptive field model; image classification; image
                 representation; neural nets; Neural networks; physical
                 feature representation; practical SER system; sound
                 event classification; sound event detection;
                 Spectrogram; spectrogram image feature; Speech; speech
                 recognition; Speech recognition",

  author =       "L. Yang and M. Zhang and Y. Liu and M. Sun and N. Yu
                 and G. Fu",
  title =        "Joint {POS} Tagging and Dependence Parsing With
                 Transition-Based Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1352--1358",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Artificial neural networks; dependence parsing;
                 dependency parsing; Dependency parsing; feature
                 sparsity; grammars; joint model; joint modeling;
                 Labeling; labeling conflicts; natural language
                 processing; natural languages; Natural languages;
                 neural nets; neural network based classifiers; neural
                 networks; part-of-speech tagging; pattern
                 classification; POS tagging; shift-reduce conflicts;
                 Speech; Syntactics; Tagging; tagging conflicts;
                 transition-based neural networks",

  author =       "K. Yu and Z. Zhao and X. Wu and H. Lin and X. Liu",
  title =        "Rich Short Text Conversation Using
                 Semantic-Key-Controlled Sequence Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1359--1368",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "chatbot; controllable memory trigger; Data models;
                 Decoding; external-memory tensor; learning (artificial
                 intelligence); Logic gates; natural language
                 processing; Question and answer;
                 semantic-key-controlled sequence generation; Semantics;
                 semantics; sequence to sequence learning;
                 sequence-to-sequence learning approach;
                 sequence-to-sequence model; sequence-to-sequence
                 training; sequences; short text conversation; short
                 text conversation (STC); Speech; Speech processing;
                 STC; text analysis; Training",

  author =       "B. Lehner and J. Schl{\"u}ter and G. Widmer",
  title =        "Online, Loudness-Invariant Vocal Detection in Mixed
                 Music Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1369--1380",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; Feature extraction; Hidden
                 Markov models; human singing voice expressive richness;
                 human singing voice timbral richness; Instruments;
                 interfering instrumental accompaniment; learning
                 (artificial intelligence); long short-term memory
                 recurrent neural network classifier; loudness;
                 LSTM-RNN; machine learning; mixed music signals; music;
                 music information retrieval; music recording; neural
                 network; online loudness-invariant vocal detection;
                 recurrent neural nets; signal classification; Singing
                 voice detection; singing voice detection; sound
                 production system; Spectrogram; Speech; Speech
                 processing; Task analysis; VD; voice activity
                 detection",

  author =       "S. Stone and M. Marxen and P. Birkholz",
  title =        "Construction and Evaluation of a Parametric
                 One-Dimensional Vocal Tract Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1381--1392",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "aero-acoustic simulations; articulatory speech
                 synthesis; articulatory synthesis; Computational
                 modeling; consonant recognition rate; Electron tubes;
                 German consonants; German vowels; higher dimensional
                 vocal tract model; Larynx; mean square error methods;
                 minimum root-mean-square error; onedimensional vocal
                 tract area function; parametric one-dimensional vocal
                 tract model; reference area functions; Shape; Solid
                 modeling; Speech; speech production; speech
                 recognition; speech synthesis; Three-dimensional
                 displays; Vocal tract models; vocal tract shapes; vowel
                 recognition rate",

  author =       "T. Tan and Y. Qian and H. Hu and Y. Zhou and W. Ding
                 and K. Yu",
  title =        "Adaptive Very Deep Convolutional Residual Network for
                 Noise Robust Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1393--1405",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic modeling; Adaptation models; adaptive very
                 deep convolutional residual network; additive noise;
                 advanced model; AMI; Aurora4; automatic speech
                 recognition; canonical model; CAT; Cats; channel
                 distortion; CHiME4; cluster adaptive training;
                 convolutional neural network; deep convolutional neural
                 networks; different noisy conditions; factor aware
                 training; FAT; feedforward neural nets; model
                 adaptation; Noise measurement; noise robust speech
                 recognition; noisy environments; noisy scenarios;
                 performance degradation; real noisy data; residual
                 learning; reverberation; Robust speech recognition;
                 simulated data; Speech; Speech recognition; speech
                 recognition; superior noise robustness; system
                 performance; Task analysis; testing conditions;
                 Training; transcription task; VDCRN; WER; word error
                 rate",

  author =       "X. Wang and S. Takaki and J. Yamagishi",
  title =        "Autoregressive Neural {F0} Model for Statistical
                 Parametric Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1406--1419",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Artificial neural networks; autoregressive model;
                 autoregressive neural F0 model; conventional mean-based
                 generation method; DAR; data dropout strategies; Data
                 models; F0; F0 contours; F0 datum; Feature extraction;
                 Fundamental frequency; fundamental frequency models;
                 Hidden Markov models; Linguistics; neural network;
                 noisy F0 contours; nonlinear AR dependency; normal RNN;
                 pitch; recurrent neural nets; recurrent neural
                 networks; SAR; shallow autoregressive recurrent mixture
                 density network; Speech; speech synthesis; statistical
                 dependency; statistical parametric speech synthesis;
                 temporal dependency; text-to-speech synthesis",

  author =       "C. Valentini-Botinhao and J. Yamagishi",
  title =        "Speech Enhancement of Noisy and Reverberant Speech for
                 Text-to-Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1420--1433",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "additive noise data; clean data; dereverberation;
                 enhanced synthetic voice; environmental noise;
                 event-based scheduling; Feature extraction; generalized
                 closed skew normal distribution; Noise measurement;
                 noise suppression; noise-only case; noisy recordings;
                 parallel data; recurrent neural nets; recurrent neural
                 network; Remote state estimation; reverberant
                 recordings; reverberant speech; Reverberation;
                 reverberation; Speech; speech enhancement; Speech
                 enhancement; speech enhancement methods; studio-quality
                 recordings; text-to-speech text-to-speech; Training",

  author =       "A. I. Koutrouvelis and T. W. Sherson and R. Heusdens
                 and R. C. Hendriks",
  title =        "A Low-Cost Robust Distributed Linearly Constrained
                 Beamformer for Wireless Acoustic Sensor Networks With
                 Arbitrary Topology",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1434--1448",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "arbitrary distributed network topologies; array signal
                 processing; cross power spectral density matrix;
                 Distributed beamforming; Estimation error; filtering
                 theory; LCMV; linear equality constraints; matrix
                 algebra; Microphones; MVDR; Network topology; Noise
                 measurement; optimisation; optimization problem;
                 relative acoustic transfer function estimation errors;
                 Reverberation; robust beamforming; robust distributed
                 linearly constrained beamformer; Robustness; speech
                 enhancement; WASN; wireless acoustic sensor network;
                 wireless sensor networks",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1449--1450",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "1451--1452",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "C3--C3",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "8",
  pages =        "C4--C4",
  month =        aug,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "C1--C1",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "C2--C2",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1453--1454",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents [Edics]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1455--1456",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "C. Wu and C. Dittmar and C. Southall and R. Vogl and
                 G. Widmer and J. Hockman and M. M{\"u}ller and A.
                 Lerch",
  title =        "A Review of Automatic Drum Transcription",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1457--1483",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "ADT research; ADT systems; ADT techniques; automatic
                 drum transcription; automatic music transcription;
                 classification; computational methods; deep learning;
                 drum part; drum sound events; drum-specific variations;
                 information retrieval; Instruments; machine learning;
                 matrix decomposition; matrix factorization; music;
                 Music information retrieval; music information
                 retrieval; musical style; nonnegative matrix
                 factorization; pattern classification; percussion;
                 recorded music; recurrent neural nets; Rhythm;
                 rhythm-related music processing tasks; Spectrogram;
                 Speech processing; state-of-the-art systems; Task
                 analysis; task-specific challenges; Transient analysis;
                 umbrella term automatic drum transcription; Western
                 popular music",

  author =       "C. Evers and P. A. Naylor",
  title =        "Acoustic {SLAM}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1484--1498",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "accurate positional information; acoustic generators;
                 Acoustic scene mapping; acoustic signal processing;
                 acoustic signals; Acoustic Simultaneous Localization;
                 Acoustic SLAM; acoustic sources; array signal
                 processing; Bayes methods; consequent false DoA
                 estimates; Direction-of-Arrival; Direction-of-arrival
                 estimation; direction-of-arrival estimation; inactivity
                 lead; microphones; missing DoA estimates; multiple
                 sound sources; observer motion; Observers; positional
                 source information; Probability density function;
                 Reverberation; reverberation; robot audition; scene
                 map; Simultaneous localization and mapping;
                 simultaneous localization and mapping; SLAM (robots);
                 sound source localization accuracy; source directions;
                 source location estimation; source-sensor range;
                 Speech; three-dimensional representation",

  author =       "C. Laroche and M. Kowalski and H. Papadopoulos and G.
                 Richard",
  title =        "Hybrid Projective Nonnegative Matrix Factorization
                 With Drum Dictionaries for Harmonic\slash Percussive
                 Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1499--1511",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "audio signal; audio signal processing; audio source
                 separation; blind source separation; Dictionaries; drum
                 dictionaries; Harmonic analysis; harmonic source
                 separation algorithms; harmonic/percussive
                 decomposition; hybrid projective nonnegative matrix
                 factorization; Instruments; matrix decomposition;
                 Matrix decomposition; Multiple signal classification;
                 multiplicative update rules; Music; music; music
                 database; music signals; Nonnegative matrix
                 factorization; orthogonal nonnegative decomposition;
                 percussive source separation algorithms; projective
                 nonnegative matrix factorization; short-term broadband
                 sounds; signal representation; signal time frequency
                 representation decomposition; smooth spectra prelearned
                 dictionary; source separation; Source separation;
                 sparse decomposition; sparse nonnegative decomposition;
                 straightforward NMF decomposition; tonal part;
                 transient part",

  author =       "J. J. Carabias-Orti and J. Nikunen and T. Virtanen and
                 P. Vera-Candeas",
  title =        "Multichannel Blind Sound Source Separation Using
                 Spatial Covariance Model With Level and Time
                 Differences and Nonnegative Matrix Factorization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1512--1527",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "achieved separation performance; audio signal
                 processing; blind source separation; complex-valued
                 nonnegative matrix factorization; covariance matrices;
                 Covariance matrices; direction of arrival estimation;
                 Direction-of-arrival estimation; direction-of-arrival
                 estimation; direction-of-arrival kernels; DOA kernels;
                 Euclidean distance; explicit modeling; interaural level
                 difference; interaural time difference; Itakura-Saito
                 divergence; Kernel; level difference covariance
                 matrices; level differences; magnitude spectrograms;
                 matrix decomposition; Microphones; microphones;
                 multichannel blind sound source separation;
                 Multichannel source separation; NMF model; non-negative
                 matrix factorization; phase difference covariance
                 matrices; predefined source directions; reverberation;
                 SCM model; source localization; Source separation;
                 source spatial covariance matrices; spatial covariance
                 model; spatial properties; Spectrogram; time
                 differences; Time-frequency analysis; two-channel SiSEC
                 development dataset",

  author =       "M. Zhang and N. Yu and G. Fu",
  title =        "A Simple and Effective Neural Model for Joint Word
                 Segmentation and {POS} Tagging",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1528--1538",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Bidirectional control; Chinese natural language
                 processing; Chinese word segmentation; Decoding; joint
                 model; joint word segmentation; learning (artificial
                 intelligence); long short term memory neural network
                 structures; Natural language processing; natural
                 language processing; neural joint model; neural nets;
                 Neural networks; neural networks; POS tagging;
                 Predictive models; sequence-to-sequence neural model;
                 Tagging; Task analysis; transition system; well-defined
                 transition system",

  author =       "D. Menzies and F. M. Fazi",
  title =        "A Complex Panning Method for Near-Field Imaging",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1539--1548",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "adaptive panning method; Augmented reality; complex
                 panning method; conventional amplitude panning; distant
                 objects; Ear; extended panning method; Frequency
                 control; Frequency-domain analysis; head orientation;
                 hearing; image direction; Imaging; Inter-aural Level
                 Difference cues; loudspeakers; Loudspeakers; near-field
                 image; near-field region; single first order filter;
                 spatial audio; Speech processing; stereo; stereo image
                 processing; stereo panning functions; tangent law;
                 transfer functions; VBAP",

  author =       "A. Misra and J. H. L. Hansen",
  title =        "Maximum-Likelihood Linear Transformation for
                 Unsupervised Domain Adaptation in Speaker
                 Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1549--1558",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "domain adaptation; EM algorithm;
                 expectation-maximisation algorithm;
                 expectation-maximization algorithm; front-end factor
                 analysis; Gaussian mixture model; Gaussian processes;
                 GMM; i-Vector space; in-domain development data;
                 maximum-likelihood linear transformation; mixture
                 models; National Institute of Standards and Technology
                 Speaker Recognition Evaluation; optimisation;
                 optimization process; out-of-domain development data;
                 probability; probability density estimation problem;
                 speaker recognition; speaker recognition evaluation;
                 Speaker verification; SRE-2016 corpus; transforms;
                 unsupervised domain adaptation; unsupervised
                 probabilistic feature transformation parameters; UPFT",

  author =       "Y. Wakabayashi and T. Fukumori and M. Nakayama and T.
                 Nishiura and Y. Yamashita",
  title =        "Single-Channel Speech Enhancement With Phase
                 Reconstruction Based on Phase Distortion Averaging",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1559--1569",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "amplitude spectrum; Discrete Fourier transforms;
                 fundamental frequency; Harmonic analysis; harmonic
                 enhancement; harmonic phase spectra; harmonic
                 structure; Noise measurement; phase distortion; phase
                 distortion averaging; phase distortion feature; Phase
                 reconstruction; phase reconstruction method;
                 Reconstruction algorithms; signal reconstruction;
                 single-channel speech enhancement; Speech enhancement;
                 speech enhancement; speech phase spectrum; speech
                 quality; speech signal; Time-frequency analysis;
                 time-frequency analysis",

  author =       "S. Fu and T. Wang and Y. Tsao and X. Lu and H. Kawai",
  title =        "End-to-End Waveform Utterance Enhancement for Direct
                 Evaluation Metrics Optimization by Fully Convolutional
                 Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1570--1584",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Automatic speech recognition; automatic speech
                 recognition system; clean speech; direct evaluation
                 metrics optimization; end-to-end speech enhancement;
                 end-to-end utterance-based speech enhancement
                 framework; end-to-end waveform utterance enhancement;
                 evaluation criterion; FCN enhancement framework; fully
                 convolutional neural network; fully convolutional
                 neural networks; learning (artificial intelligence);
                 Linear programming; long speech segments; mean square
                 error; mean square error methods; model optimization
                 criterion; MSE-optimized speech; neural nets; Noise
                 measurement; noisy speech; optimisation; Optimization;
                 perception-based objective function; raw waveform;
                 short-time objective intelligibility measure; Speech;
                 Speech enhancement; speech enhancement; speech
                 intelligibility; speech recognition; STOI measure;
                 temporal correlation information; Training; training",

  author =       "K. Xiao and S. Wang and M. Wan and L. Wu",
  title =        "Radiated Noise Suppression for Electrolarynx Speech
                 Based on Multiband Time-Domain Amplitude Modulation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1585--1593",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic characteristics; amplitude modulation;
                 artificial noise; EL speech; electrolarynx speech;
                 Electrolarynx speech; enhancement; MTAM; multiband
                 time-domain amplitude modulation; perceptual
                 characteristics; radiated noise; radiated noise
                 suppression; residual noise intensity; speech
                 components; speech enhancement; speech intelligibility;
                 speech quality; time-domain amplitude modulation;
                 Wiener filters",

  author =       "A. Fahim and P. N. Samarasinghe and T. D. Abhayapala",
  title =        "{PSD} Estimation and Source Separation in a Noisy
                 Reverberant Environment Using a Spherical Microphone
                 Array",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1594--1607",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "array signal processing; Bessel functions; coherent
                 background noise; Correlation; Estimation; Harmonic
                 analysis; individual power spectral density components;
                 inherent orthogonality; microphone arrays; Microphone
                 arrays; multisource reverberant sound scene; Noise
                 measurement; Noise suppression; power spectral density;
                 PSD components; PSD estimation; Reverberation;
                 reverberation; source separation; speech
                 dereverberation; spherical harmonics basis functions;
                 spherical harmonics domain; spherical microphone
                 array",

  author =       "H. He and J. Chen and J. Benesty and T. Yang",
  title =        "Noise Robust Frequency-Domain Adaptive Blind
                 Multichannel Identification With $\ell_p$-Norm
                 Constraint",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1608--1619",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "$\ell _p$-norm penalty; $\ell _p$-norm constraint; acoustic
                 communication (telecommunication); acoustic signal
                 processing; Acoustics; adaptive filter; adaptive
                 filters; Blind multichannel identification; blind
                 source separation; channel estimation; Cost function;
                 frequency-domain adaptive filtering; frequency-domain
                 analysis; Frequency-domain analysis; least mean squares
                 methods; noise robust frequency-domain adaptive blind
                 multichannel identification; noise-free environments;
                 RNMCFLMS algorithm; robust normalized multichannel
                 frequency-domain least mean square algorithm;
                 Robustness; robustness; Signal processing algorithms;
                 SIMO system; single-input multiple-output acoustic
                 system; sparsity; spectral flatness constraint; Speech
                 processing; Time-domain analysis; transient response",

  author =       "W. Zhang and Z. Chen and F. Yin and Q. Zhang",
  title =        "Melody Extraction From Polyphonic Music Using Particle
                 Filter and Dynamic Programming",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1620--1632",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; audio signal processing;
                 Bayes methods; Bayesian filtering; Bayesian filtering
                 framework; constant-Q transform; Data mining; Dynamic
                 programming; dynamic programming; feature extraction;
                 frame-wise pitches; Harmonic analysis; information
                 retrieval; instrumental melodies; melodic contour;
                 Melody extraction; melody extraction method;
                 multiresolution spectral analysis; music; music
                 information; Music information retrieval; music
                 information retrieval; music information retrieval
                 community; particle filter; particle filtering
                 (numerical methods); pitch transition probability;
                 polyphonic music; probability; publicly available
                 dataset; rough melody contour; spectral analysis;
                 statistical analysis; Timbre; vocal melodies",

  author =       "C. Zhang and K. Koishida and J. H. L. Hansen",
  title =        "Text-Independent Speaker Verification Based on Triplet
                 Convolutional Neural Network Embeddings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1633--1644",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "channel variabilities compensation; conventional
                 speaker recognition pipelines; deep neural networks;
                 end-to-end fashion; Euclidean distance; Euclidean
                 distance similarity metric; feature extraction; feature
                 representation; feedforward neural nets; fixed-length
                 input constraint; fixed-length input speaker embedding
                 system; fixed-length speaker discriminative embedding;
                 front-end speaker; i-vector; Inception-Resnet-v1
                 architecture; learning (artificial intelligence);
                 network training; neural network based speaker
                 discriminative training; Neural networks; NIST; noise
                 variabilities compensation; novel text-independent
                 speaker verification framework; performance gain; PLDA;
                 probabilistic linear discriminant analysis; severe test
                 condition mismatches; severe training condition
                 mismatches; sparse speech features; spatial pyramid
                 pooling; spatial pyramid pooling layer; Speaker
                 recognition; speaker recognition; Speech processing;
                 statistical analysis; SV system; SV task; SV testing;
                 system performance; Task analysis; testing performance;
                 Training; triplet convolutional neural network
                 embeddings; triplet loss; very deep convolutional
                 neural network architecture; very deep convolutional
                 neural networks",

  author =       "A. R. MV and P. K. Ghosh",
  title =        "{PSFM} --- {A} Probabilistic Source Filter Model for Noise
                 Robust Glottal Closure Instant Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1645--1657",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "all-pole filter coefficients; archivable priority list
                 actual-word database database; Bernoulli Gaussian
                 distribution; clean speech; computational complexity;
                 database management systems; Dynamic programming;
                 dynamic programming; exact GCI locations; filtering
                 theory; Gaussian distribution; GCI detection; Gibbs
                 sampling; glottal inverse filtering; Heuristic
                 algorithms; N-best dynamic programming; noise robust
                 GCI detection technique; noise robust glottal closure
                 instant detection; Noise robustness; pathological
                 speech; pitch synchronous speech analysis;
                 Probabilistic logic; probabilistic source-filter model;
                 probability; prosody modifications; PSFM; second-order
                 statistics; Signal to noise ratio; signal-to-noise
                 ratio levels; Speech processing; speech processing;
                 voiced speech",

  author =       "M. Airaksinen and L. Juvela and B. Bollepalli and J.
                 Yamagishi and P. Alku",
  title =        "A Comparison Between {STRAIGHT}, Glottal, and
                 Sinusoidal Vocoding in Statistical Parametric Speech
                 Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1658--1670",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; Acoustics;
                 analysis-synthesis; crowd-sourced listening test;
                 formal test; glottal vocoding; GlottDNN; mixed
                 excitation vocoders; PML; Predictive models;
                 Production; pulse model in log-domain; shared envelope
                 model; sinusoidal vocoding; speech coding; Speech
                 synthesis; speech synthesis; Speech synthesis; speech
                 waveform; statistical analysis; statistical parametric
                 speech synthesis; statistical parametric speech
                 synthesis framework; straight vocoding; synthesized
                 speech quality; text-to-speech synthesis; Transfer
                 functions; TTS synthesis; vocoder; vocoder quality;
                 vocoder-specific features; vocoders; Vocoders; waveform
                 generation method",

  author =       "G. Mah{\'e} and M. Ja{\"\i}dane",
  title =        "Perceptually Controlled Reshaping of Sound
                 Histograms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1671--1683",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "audio processing algorithms; audio signal processing;
                 filtering theory; flat-spectrum version; frequency
                 masking model; Frequency-domain analysis; generic
                 algorithm; HGR; histogram global reshaping; histogram
                 local reshaping; histogram low-pass filtering;
                 Histograms; inaudible noise; iterative methods;
                 low-pass filtering; low-pass filters; low-power white
                 noise; noise audibility; noise audibility control;
                 optimal performance; quantisation (signal);
                 Quantization (signal); quantization theorem; Shape;
                 signal-plus-noise mixture; Sound histogram
                 equalization; sound histograms; sound reshaping; Source
                 separation; source separation; sparsification; specific
                 signal statistical distributions; Speech processing;
                 statistical distributions; target histogram;
                 Time-domain analysis; white noise",

  author =       "Q. Huang and L. Zhang and Y. Fang",
  title =        "Two-Step Spherical Harmonics {ESPRIT}-Type Algorithms
                 and Performance Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1684--1697",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "array signal processing; complex spherical harmonics
                 domain; computational complexity; decomposition;
                 Direction-of-arrival (DOA) estimation;
                 direction-of-arrival estimation; DOA estimation;
                 eigenvalue decomposition; eigenvalues and
                 eigenfunctions; estimation of signal parameter via
                 rotational invariance technique (ESPRIT); EVD;
                 high-resolution estimation of signal parameter via
                 rotational invariance technique; matrix algebra; mean
                 square error (MSE); mean square error methods; mean
                 square errors; MSE; parameter estimation; real-valued
                 two-step SHESPRIT; semiRTS-SHESPRIT method; signal
                 resolution; spherical array; spherical arrays;
                 TS-SHESPRIT; two-step method; two-step spherical
                 harmonics ESPRIT-type algorithms; unitary",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1698--1699",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "1700--1702",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "C3--C3",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "9",
  pages =        "C4--C4",
  month =        sep,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "C1--C1",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "C2--C2",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1698--1699",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents [Edics]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1700--1701",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "D. Wang and J. Chen",
  title =        "Supervised Speech Separation Based on Deep Learning:
                 an Overview",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1702--1726",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "array separation; beamforming; deep learning; deep
                 neural networks; Interference; learning (artificial
                 intelligence); multitalker separation; Noise
                 measurement; Speech separation; speaker separation;
                 speech dereverberation; Speech enhancement; speech
                 enhancement; speech intelligibility; speech-nonspeech
                 separation; Supervised learning; supervised learning
                 problem; supervised separation algorithms; supervised
                 speech separation; target speech; Task analysis;
                 time-frequency masking; Training",

  author =       "R. Wang and M. Utiyama and A. Finch and L. Liu and K.
                 Chen and E. Sumita",
  title =        "Sentence Selection and Weighting for Neural Machine
                 Translation Domain Adaptation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1727--1741",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Adaptation models; conventional phrase-based machine
                 translation; Decoding; domain adaptation; domain
                 adaptation techniques; domain tags; domain weighting;
                 domain-specific tasks; dynamic training methods;
                 in-domain corpus; language translation; learning
                 (artificial intelligence); machine translation tasks;
                 multidomain sentence; natural language processing;
                 Neural machine translation; neural machine translation
                 domain adaptation; NMT domain problem; NMT internal
                 sentence embedding; NMT performance; NMT training;
                 out-of-domain corpora; out-of-domain sentences;
                 real-world NMT scenario; sentence embedding similarity;
                 sentence level NMT domain adaptation; sentence
                 selection; sentence weighting methods; Speech
                 processing; statistical analysis; Task analysis;
                 Testing; Training; Training data; translation

  author =       "F. U. Khan and B. P. Milner and T. {Le Cornu}",
  title =        "Using Visual Speech Information in Masking Methods for
                 Audio Speaker Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1742--1754",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "audio feature space; audio information; audio mask;
                 audio ratio; audio signal processing; audio speaker
                 separation; audio-masking-based speaker separation;
                 audio-visual masking methods; audio-visual masks;
                 audio-visual processing; audio-visual ratio masks;
                 binary masks; Cameras; deep neural network; Estimation;
                 feature extraction; Feature extraction; intelligibility
                 tests; Lips; masking methods; neural nets; ratio mask;
                 speaker recognition; Speaker separation; speech
                 intelligibility; speech mixture; speech processing;
                 Speech processing; speech quality; target speech;
                 Time-frequency analysis; visual information; visual
                 speech features; visual speech information; visual-only
                 methods; Visualization; visually derived binary mask
                 estimation; visually derived ratio mask estimation",

  author =       "X. Li and S. Gannot and L. Girin and R. Horaud",
  title =        "Multichannel Identification and Nonnegative
                 Equalization for Dereverberation and Noise Reduction
                 Based on Convolutive Transfer Function",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1755--1768",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal processing; additive noise; Additive
                 noise; Blind equalizers; blind multichannel
                 identification; blind room impulse response
                 identification; blind source separation; common zeros
                 problem; complex-valued convolution model;
                 complex-valued CTFs; convolution; Convolution;
                 convolutive transfer function; CTF magnitude;
                 dereverberation; equalisers; filtering theory; Fourier
                 transforms; frequency aliasing; frequency response;
                 Frequency response; joint speech dereverberation; long
                 impulse responses; Microphones; microphones;
                 multichannel equalization; Multichannel identification;
                 near-common zeros; noise power related tolerance; Noise
                 reduction; noise reduction; nonflat frequency response;
                 nonnegative convolution model; nonnegative
                 equalization; nonnegative multichannel equalization
                 method; oversampled signals; oversampled STFT;
                 reverberation; short-time Fourier; signal sampling;
                 source signal; STFT framework; STFT magnitude; STFT
                 window; Time-domain analysis; time-domain analysis;
                 time-domain cross-relation method; time-domain impulse
                 response; transfer functions; transient response",

  author =       "L{\"u}tfi Kerem {\c{S}}enel and {\.I}hsan Utlu and
                 Veysel Y{\"u}cesoy and Aykut Ko{\c{c}} and Tolga
                 {\c{C}}ukur",
  title =        "Semantic Structure and Interpretability of Word
                 Embeddings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1769--1779",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Interpretability; latent semantic structure; natural
                 language processing; Natural language processing;
                 natural language processing; NLP; semantic relations;
                 semantic structure; Semantics; Sparse matrices; Speech
                 processing; Standards; Statistical analysis; Task
                 analysis; vector spaces; word embeddings; word
                 embeddings interpretability; word intrusion test",

  author =       "Y. Koizumi and K. Niwa and Y. Hioka and K. Kobayashi
                 and Y. Haneda",
  title =        "{DNN}-Based Source Enhancement to Increase Objective
                 Sound Quality Assessment Score",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1780--1792",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "backpropagation; black-box-optimization scheme; deep
                 learning; deep neural network based source enhancement;
                 DNN optimization scheme; Estimation; gradient methods;
                 high OSQA scores; high-quality output signals; learning
                 (artificial intelligence); Linear programming; mean
                 square error methods; neural nets; objective sound
                 quality assessment (OSQA) score; objective sound
                 quality assessment score; optimisation; Optimization;
                 policy gradient method; probability; Quality
                 assessment; sound-quality evaluation; Sound-source
                 enhancement; speech enhancement; Speech processing;
                 Time-frequency analysis; time-frequency mask",

  author =       "C. Paleologu and J. Benesty and S. Ciochin{\u{a}}",
  title =        "Linear System Identification Based on a {Kronecker}
                 Product Decomposition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1793--1808",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic impulse responses; acoustic signal
                 processing; approximation theory; Convergence; echo
                 cancelation perspective; echo cancelers; echo
                 cancellation; Echo cancellers; echo paths; echo
                 suppression; filtering theory; identification; impulse
                 response decomposition; iterative algorithm; Iterative
                 methods; iterative methods; iterative Wiener filter;
                 linear system identification; Linear systems; linear
                 systems; long length impulse responses; Matrix
                 decomposition; nearest Kronecker product; nearest
                 Kronecker product decomposition; optimal impulse
                 response approximation; Speech processing; statistical
                 analysis; statistics estimation; System identification;
                 system identification problem; transient response;
                 Wiener filter; Wiener filters",

  author =       "F. Xiong and S. Goetze and B. Kollmeier and B. T.
                 Meyer",
  title =        "Exploring Auditory-Inspired Acoustic Features for Room
                 Acoustic Parameter Estimation From Monaural Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1809--1820",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic characterisation; acoustic environments;
                 acoustic features; acoustic noise; acoustic signal
                 processing; architectural acoustics; artificial neural
                 network; auditory-inspired acoustic features; automatic
                 speech recognition; blind estimation; blind ROom
                 Parameter Estimator; channel bank filters;
                 early-to-late reverberation ratio; ELR estimation;
                 Estimation; Frequency modulation; fullband signals;
                 improved fullband estimations; individual filters;
                 machine learning; monaural speech; neural nets;
                 real-time applications; reverberant environments;
                 reverberation; Reverberation; reverberation time;
                 Reverberation time; room acoustic parameter estimation;
                 room acoustic parameters; room impulse responses; ROPE
                 model; ROPE performance; signal enhancement algorithms;
                 single-microphone speech signals; spectral analysis;
                 Speech enhancement; speech enhancement; speech
                 recognition; speech time-frequency representation;
                 speech variability; subband signals; temporal
                 modulation filter bank; temporal modulation
                 frequencies; time 3.0 s; transient response",

  author =       "G. {Le Lan} and D. Charlet and A. Larcher and S.
                 Meignier",
  title =        "An Adaptive Method for Cross-Recording Speaker
                 Diarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1821--1832",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic conditions; acoustic mismatch; Acoustics;
                 Adaptation models; between-recording variability
                 compensation methods; between-recording variability
                 estimation; cross-recording DER; cross-recording
                 speaker diarization; domain adaptation; Estimation;
                 Hidden Markov models; initial training dataset; linking
                 system; Mathematical model; out-of-domain data; Radio
                 recordings; scalable unsupervised adaptation framework;
                 Speaker diarization; speaker linking; speaker
                 recognition; Task analysis; Training; unlabeled
                 speakers; unsupervised learning; variable collection

  author =       "W. Xue and A. H. Moore and M. Brookes and P. A.
                 Naylor",
  title =        "Modulation-Domain Multichannel {Kalman} Filtering for
                 Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1833--1847",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Array signal processing; Correlation; Estimation;
                 Fourier transforms; inter-frame temporal evolution;
                 interchannel spatial correlation; interframe temporal
                 correlation; Kalman filtering; Kalman filters;
                 microphone arrays; Microphones; modulation domain;
                 modulation-domain multichannel Kalman filtering;
                 multichannel KF; multichannel methods; Noise
                 measurement; optimal filters; optimal MKF gain;
                 second-order signal statistics; single-channel Kalman;
                 single-channel modulation-domain KF; single-channel
                 speech enhancement methods; Speech enhancement; speech
                 enhancement; Speech enhancement; speech spectrum",

  author =       "K. Wu and V. G. Reju and A. W. H. Khong",
  title =        "Multisource {DOA} Estimation in a Reverberant
                 Environment Using a Single Acoustic Vector Sensor",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1848--1859",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal processing; acoustic vector sensor;
                 blind source separation; direction-of-arrival
                 estimation; Direction-of-arrival estimation;
                 direction-of-arrival estimation; DOA estimation;
                 Estimation; Indexes; low-reverberant-single-source;
                 LRSS detection; LRSS point detection; Microphones;
                 multiple sources; multiple speech sources; multisource
                 DOA estimation; multisource reverberant environments;
                 reverberant environment; Reverberation; reverberation;
                 Robot sensing systems; signal detection; single
                 acoustic vector sensor; source signals; speech
                 processing; TF domain; TF-point level; TF-zone level;
                 time-frequency analysis; time-frequency domain",

  author =       "J. Huang and Y. Sun and W. Zhang and H. Wang and T.
                 Liu",
  title =        "Entity Highlight Generation as Statistical and Neural
                 Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1860--1872",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "attention mechanism; Computational modeling; copy
                 mechanism; coverage mechanism; Decoding; decoding
                 process; Entity highlight generation; entity highlight
                 generation; entity name; entity-specific highlights;
                 language translation; learning (artificial
                 intelligence); Manuals; natural language processing;
                 neural machine translation; neural nets; neural
                 summarization; Seq2Seq approach; Seq2Seq model;
                 sequence-to-sequence learning approach; Speech
                 processing; statistical analysis; statistical machine
                 translation; Task analysis; Training data; Web search",

  author =       "Q. T. Do and S. Sakti and S. Nakamura",
  title =        "Sequence-to-Sequence Models for Emphasis Speech
                 Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1873--1883",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "emphasis estimation; Emphasis estimation; Emphasis
                 Speech Translation Speech-to-speech translation
                 systems; emphasis translation; emphasis translation
                 task; Hidden Markov models; joint optimization; joint
                 optimization of words and emphasis; joint translation
                 model; language translation; Linguistics; natural
                 language processing; optimisation; Optimization;
                 Pipelines; Quantization (signal); S2ST systems;
                 sequence translation tasks; sequence-to-sequence
                 models; Speech processing; speech processing; speech
                 synthesis; speech-to-speech translation (S2ST); Task
                 analysis; translation models; translation performance",

  author =       "F. Fontana and E. Bozzo",
  title =        "Explicit Fixed-Point Computation of Nonlinear
                 Delay-Free Loop Filter Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1884--1896",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Computational modeling; delay-free loops; Digital
                 delay-free loop; digital filters; discrete-time
                 nonlinear filter networks; discrete-time realization;
                 EMS VCS3 analog synthesizer; explicit fixed-point
                 computation; fixed-point method; fixed-point search;
                 fixed-point solvers; Integrated circuit modeling;
                 iterative method; iterative methods; Mathematical
                 model; Modulation; nonlinear delay-free loop filter
                 networks; nonlinear differential equations; nonlinear
                 filter network; nonlinear filters; Numerical models;
                 ring modulator; RLC circuits; Speech processing;
                 voltage-controlled filter; voltage-controlled

  author =       "S. Widmark",
  title =        "Causal {IIR} Audio Precompensator Filters Subject to
                 Quadratic Constraints",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1897--1912",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal processing; causal IIR audio
                 precompensator filters; computational complexity;
                 control system synthesis; Convex functions; Delays;
                 Design methodology; discrete time filters;
                 discrete-time multiple-input multiple-output filter;
                 feedforward; Finite impulse response filters; FIR
                 filters; Frequency-domain analysis; gain control; IIR
                 filters; impulse response Wiener filtering; infinite
                 impulse response Wiener precompensator design; linear
                 feedforward controller design; linear quadratic
                 control; linear quadratic optimal; linear systems;
                 Loudspeakers; optimization methods; Signal processing
                 algorithms; Transfer functions; transient response;
                 Wiener filters",

  author =       "F. Winter and H. Wierstorf and C. Hold and F.
                 Kr{\"u}ger and A. Raake and S. Spors",
  title =        "Colouration in Local Wave Field Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1913--1924",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic field; acoustic signal processing;
                 ambisonics; colouration; driving signals; emitted sound
                 fields; extended listening area; Frequency-domain
                 analysis; Harmonic analysis; hearing; listening
                 experiments; local wave field synthesis; Loudspeakers;
                 loudspeakers; Mathematical model;
                 near-field-compensated higher order ambisonics;
                 perceived colouration; Rendering (computer graphics);
                 Sound field synthesis; sound field synthesis
                 techniques; Speech processing; timbre; Timbre; wave
                 field synthesis",

  author =       "A. H. Andersen and J. M. {de Haan} and Z. Tan and J.
                 Jensen",
  title =        "Nonintrusive Speech Intelligibility Prediction Using
                 Convolutional Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1925--1939",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Artificial intelligence; Auditory system;
                 computational structure; convolution; Convolutional
                 neural networks; convolutional neural networks; deep
                 learning; learning (artificial intelligence); neural
                 nets; Noise measurement; nonintrusive SIP algorithms;
                 Nonintrusive speech intelligibility prediction;
                 nonintrusive speech intelligibility prediction;
                 Prediction algorithms; Signal processing algorithms;
                 speech intelligibility; Speech processing; speech
                 processing; speech processing algorithms; speech
                 processing devices",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1940--1941",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "1942--1944",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "C3--C3",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "10",
  pages =        "C4--C4",
  month =        oct,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "C1--C1",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "C2--C2",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "1945--1946",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents [Edics]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "1947--1948",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "H. Hadian and H. Sameti and D. Povey and S.
                 Khudanpur",
  title =        "Flat-Start Single-Stage Discriminatively Trained
                 {HMM}-Based Models for {ASR}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "1949--1961",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "automatic speech recognition; CD modeling approach;
                 Context modeling; Databases; Decoding; discriminatively
                 trained HMM-based models; flat-start; flat-start
                 single-stage; Hidden Markov models; hidden Markov
                 models; hidden Markov models-GMM models; Lattice-free;
                 lattice-free maximum mutual information objective
                 function; LF-MMI setup; Linear programming; maximum
                 mutual information; Neural networks; regular tree-based
                 CD modeling; single-stage; speech recognition;
                 Training; tree-building steps; tree-free CD modeling
                 technique; vocabulary continuous speech recognition",

  author =       "F. Katzberg and R. Mazur and M. Maass and P. Koch and
                 A. Mertins",
  title =        "A Compressed Sensing Framework for Dynamic Sound-Field
                 Measurements",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "1962--1975",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "bandlimited signals; compressed sensing; Compressed
                 sensing; compressed sensing framework; compressed
                 sensing models; compressed sensing problem;
                 compressed-sensing based recovery; dynamic sampling
                 problem; dynamic sound-field measurement; dynamic
                 sound-field measurements; Interpolation; interpolation;
                 Linear systems; Mathematical model; microphone array;
                 microphone positions; microphone trajectory;
                 Microphones; modeled equidistant grid; modeled virtual
                 grid; Nyquist-Shannon sampling theorem; random chosen
                 trajectories; room impulse responses; sampling
                 positions; signal reconstruction; signal sampling;
                 sound-field variables; sparse Fourier representations;
                 spatial sampling problem; spatio-temporal sampling
                 problem; Speech processing; stationary microphones;
                 sub-Nyquist sampling; suboptimally chosen trajectories;
                 three-dimensional space; Trajectory; transient
                 response; underdetermined sampling problems",

  author =       "H. Sundar and T. V. Sreenivas and C. S. Seelamantula",
  title =        "{TDOA-Based} Multiple Acoustic Source Localization
                 Without Association Ambiguity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "1976--1990",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; array signal processing;
                 Delays; direction-of-arrival estimation;
                 Direction-of-arrival estimation; GCC-PHAT; hyperboloid
                 branches; IDIR; interhyperboloidal spatial region;
                 inverse delay interval region; microphone arrays;
                 microphone pairs; microphones; Microphones;
                 multi-source localization; multiple acoustic source
                 localization; multiple source localization; permutation
                 problem; Position measurement; region-constrained
                 localization; reverberation; Reverberation;
                 speaker recognition; Speech processing;
                 TDOA; time-difference of arrival; time-differences of
                 arrival; time-of-arrival estimation",

  author =       "R. Sahraeian and D. {Van Compernolle}",
  title =        "Cross-Entropy Training of {DNN} Ensemble Acoustic
                 Models for Low-Resource {ASR}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "1991--2001",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; Acoustics; cross-entropy
                 objective function; cross-entropy training; Deep neural
                 networks; DNN ensemble acoustic models; entropy;
                 feature extraction; Feature extraction; Hidden Markov
                 models; Interpolation; language-independent feature
                 extractors; Low resource ASR; low-resource ASR;
                 low-resource target language; model combination;
                 multilingual deep neural networks; multilingual DNN
                 acoustic model; multilingual DNN training; multilingual
                 GlobalPhone dataset; natural language processing;
                 neural nets; Neural networks; out-of-language data;
                 speech recognition; Training; Training data;
                 under-resourced languages",

  author =       "H. Dinkel and Y. Qian and K. Yu",
  title =        "Investigating Raw Wave Deep Neural Networks for
                 End-to-End Speaker Spoofing Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2002--2014",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "ASV system; ASVspoof2015 dataset; automatic speaker
                 verification; Biological neural networks; convolution;
                 convolutional LSTM neural network; deep convolutional
                 long short-term memory; Deep learning; end-to-end;
                 end-to-end speaker spoofing detection; Feature
                 extraction; feature extraction; feedforward neural
                 nets; Machine learning; malicious spoofing attempts;
                 Mel frequency cepstral coefficient; raw wave deep
                 neural networks; recurrent neural nets; security of
                 data; serious security breaches; speaker recognition;
                 speaker verification; Speech processing; spoof-aware
                 features; spoofing attack; spoofing detection; Task
                 analysis; vanilla neural networks",

  author =       "J. Zhang and R. Heusdens and R. C. Hendriks",
  title =        "Rate-Distributed Spatial Filtering Based Noise
                 Reduction in Wireless Acoustic Sensor Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2015--2026",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic communication (telecommunication); acoustic
                 signal processing; array signal processing; Bit rate;
                 energy consumption; energy efficiency; energy usage;
                 fusion center; LCMV beamforming; linearly constrained
                 minimum variance beamformer; mathematical programming;
                 microphone subset; Microphones; microphones; noise
                 reduction; Noise reduction; noise reduction
                 performance; Rate allocation; rate allocation strategy;
                 rate-distributed spatial filtering; Resource
                 management; semidefinite program; sensor selection;
                 sensor-selection-based approaches; Sensors; signal
                 statistics; sparsity; spatial filters; WASN; wireless
                 acoustic sensor networks; Wireless communication;
                 wireless sensor networks; Wireless sensor networks",

  author =       "M. Heck and S. Sakti and S. Nakamura",
  title =        "{Dirichlet} Process Mixture of Mixtures Model for
                 Unsupervised Subword Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2027--2042",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Acoustic unit discovery; Acoustics; Bayesian
                 nonparametrics; codebook; Convergence; Data models;
                 Dirichlet process; Dirichlet process mixture; ergodic
                 chain; Gibbs sampling; Hidden Markov models; Markov
                 chain Monte Carlo sampler; Markov processes; Mixture
                 models; mixture of mixtures; Monte Carlo methods;
                 nonergodic Gibbs sampler; Speech processing; speech
                 recognition; switch sampler; Switches; unsupervised
                 subword modeling",

  author =       "S. Nie and S. Liang and W. Liu and X. Zhang and J.
                 Tao",
  title =        "Deep Learning Based Speech Separation via {NMF}-Style
                 Reconstructions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2043--2055",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "deep learning; deep neural network (DNN); deep neural
                 networks; DNN; learning (artificial intelligence);
                 Machine learning; magnitude spectrograms; matrix
                 decomposition; neural nets; Neural networks; NMF-style
                 reconstructions; Noise measurement; nonnegative matrix
                 factorization; nonnegative matrix factorization (NMF);
                 representation learning technique; spectro-temporal
                 structures; Spectrogram; Speech enhancement; speech
                 processing; Speech separation; speech separation",

  author =       "H. Dubey and A. Sangwan and J. H. L. Hansen",
  title =        "Leveraging Frequency-Dependent Kernel and {DIP}-Based
                 Clustering for Robust Speech Activity Detection in
                 Naturalistic Audio Streams",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2056--2071",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "audio streaming; Clustering; CRSS long-duration
                 naturalistic noise corpus; DARPA RATS; enhanced
                 spectral decomposition; FDK statistical descriptors;
                 feature extraction; frequency-dependent kernel;
                 frequency-dependent kernel based SAD features; Gaussian
                 mixture model; Gaussian processes; Hartigan dip test;
                 Hartigan dip-based robust feature clustering; Kernel;
                 learning (artificial intelligence); machine learning
                 models; model-based approach; multiple noise-sources;
                 naturalistic audio streams; NIST OpenSAD; NIST OpenSAT;
                 NIST-OpenSAD-2015; NIST-OpenSAT-2017; one-dimensional
                 FDK-SAD features; pattern clustering; peer-led team
                 learning; principal component analysis; Rats; robust
                 speech activity detection; Robustness; SAD annotations;
                 semisupervised Gaussian mixture model; Signal to noise
                 ratio; speaker recognition; speech activity detection;
                 speech processing; Speech processing; standalone SAD
                 evaluations; statistical analysis; supervised SAD;
                 text-dependent speaker verification; Training; variable
                 model-size Gaussian mixture model; VMGMM",

  author =       "Y. Jang and J. Ham and B. Lee and K. Kim",
  title =        "Cross-Language Neural Dialog State Tracker for Large
                 Ontologies Using Hierarchical Attention",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2072--2082",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "attention mechanism; attention-weighted word vector;
                 cross language; cross-language adaptation;
                 cross-language neural dialog state tracker; dialog
                 management; Dialog state tracking; dialog state
                 tracking challenge; hierarchical attention mechanism;
                 interactive systems; language translation; learning
                 (artificial intelligence); long short term memory;
                 machine learning-based trackers; machine-translated
                 training data; natural language processing; neural
                 nets; Neural networks; Ontologies; ontologies
                 (artificial intelligence); ontology; Predictive models;
                 Speech processing; Task analysis; Training data; user
                 intent identification; user utterances; vectors;
                 Vocabulary; word processing",

  author =       "G. Weisz and P. Budzianowski and P. Su and M.
                 Ga{\v{s}}i{\'c}",
  title =        "Sample Efficient Deep Reinforcement Learning for
                 Dialogue Systems With Large Action Spaces",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2083--2097",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "ACER algorithm; actor-critic methods; artificial
                 intelligence; automated dialogue agents; deep
                 reinforcement learning; Deep reinforcement learning;
                 dialogue policy optimization; Gaussian processes; human
                 computer interaction; human-computer interaction;
                 interactive systems; learning (artificial
                 intelligence); Learning (artificial intelligence);
                 Markov processes; Neural networks; off-policy
                 reinforcement learning; Optimization; policy
                 optimization task; software agents; Speech processing;
                 spoken dialogue systems; Task analysis; Training",

  author =       "S. Lin",
  title =        "Reverberation-Robust Localization of Speakers Using
                 Distinct Speech Onsets and Multichannel Cross
                 Correlations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2098--2111",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Acoustic multisource localization; auditory
                 filterbank; CASA; channel bank filters; concurrent
                 speakers; correlation methods; Direction-of-arrival
                 estimation; direction-of-arrival estimation;
                 directions-of-arrival of speakers; encoded speech
                 onsets; Harmonic analysis; impulse response models;
                 microphone array recordings; microphone arrays;
                 microphone signals; Microphones; multichannel cross
                 correlation; multichannel cross correlations;
                 multichannel cross-correlation coefficient; multiple
                 microphones; onset detection; Psychoacoustic models;
                 reverberant room; reverberation; Reverberation;
                 reverberation-robust localization;
                 separate concurrent speakers; source separation;
                 speaker localization methods; speaker recognition;
                 Speech processing; speech signal; transforms; voice
                 activity detection",

  author =       "S. Abidin and R. Togneri and F. Sohel",
  title =        "Spectrotemporal Analysis Using Local Binary Pattern
                 Variants for Acoustic Scene Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2112--2121",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Acoustic scene; acoustic scene classification;
                 acoustic signal processing; acoustic time-frequency
                 images; capture acoustic scene information; constant-Q
                 transform; CQT; Feature extraction; feature extraction;
                 fusion; LBP; local binary pattern variants; local
                 binary patterns; Mel frequency cepstral coefficient;
                 Q-factor; signal classification; Spectrogram; temporal
                 features; time frequency analysis; time-frequency
                 analysis; Time-frequency analysis; time-frequency
                 representation; transforms; Transforms; variable-Q
                 transform; VQT",

  author =       "N. Ma and J. A. Gonzalez and G. J. Brown",
  title =        "Robust Binaural Localization of a Target Sound Source
                 by Combining Spectral Source Models and Deep Neural
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2122--2131",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; Adaptation models;
                 Auditory system; Azimuth; background model parameters;
                 background source model; binaural sound localization;
                 Binaural source localisation; biological spatial
                 hearing; Biological system modeling; Computational
                 modeling; deep neural networks; DNN-based localization
                 system; feature extraction; hearing; localization
                 process; machine hearing; machine hearing systems;
                 masking; model adaptation process; model-based
                 knowledge; neural nets; reverberation; robust binaural
                 localization; room reverberation; sound localization
                 performance; sound signals; sound source combination;
                 source azimuth posteriors output; spectral analysis;
                 spectral characteristics; spectral feature extraction;
                 spectral source models; Speech processing; target sound
                 source; target speech source; Time-frequency analysis",

  author =       "S. Wu and D. Zhang and Z. Zhang and N. Yang and M. Li
                 and M. Zhou",
  title =        "Dependency-to-Dependency Neural Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2132--2141",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Computational modeling; Decoding; decoding; dependence
                 parsing; dependence tree; encoder-decoder model;
                 encoding; language translation; Magnetic heads; neural
                 machine translation; NMT; novel sequence-to-dependence
                 framework; Predictive models; recurrent neural nets;
                 recurrent neural network; Recurrent neural networks;
                 Syntactics; Syntax; syntax-aware encoder; target
                 translation; Task analysis; translation quality;
                 translation tasks; tree structure; trees
                 (mathematics)",

  author =       "J. Xu and H. He and X. Sun and X. Ren and S. Li",
  title =        "Cross-Domain and Semisupervised Named Entity
                 Recognition in {Chinese} Social Media: a Unified
                 Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2142--2152",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Chinese social media; Chinese social media language;
                 cross-domain learning; domain similarity; in-domain
                 supervised learning; in-domain unannotated information;
                 in-domain unannotated text; Kernel; learning
                 (artificial intelligence); massive unannotated text;
                 Named entity recognition; natural language processing;
                 out-of-domain corpora; Predictive models;
                 semi-supervised learning; semisupervised learning;
                 Semisupervised learning; semisupervised named entity
                 recognition; Social network services; social networking
                 (online); Speech processing; Task analysis; text
                 analysis; Training",

  author =       "S. {Van Kuyk} and W. B. Kleijn and R. C. Hendriks",
  title =        "An Evaluation of Intrusive Instrumental
                 Intelligibility Metrics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2153--2166",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "additive noise; Additive noise; CSII; Danish speech;
                 Degradation; Distortion; Dutch speech; English speech;
                 ESTOI; HASPI; HEGP; Indexes; instrumental measures;
                 intelligibility data; Intelligibility prediction;
                 intrusive instrumental intelligibility metrics;
                 Measurement; MIKNN; monaural intrusive intelligibility
                 metrics; NCM; QSTI; sEPSM; SIIB; SIMI; Speech
                 enhancement; speech enhancement; speech
                 intelligibility; statistical analysis; statistical
                 dependencies; STOI",

  author =       "X. Ouyang and K. Gu and P. Zhou",
  title =        "Spatial Pyramid Pooling Mechanism in {3D}
                 Convolutional Network for Sentence-Level
                 Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2167--2179",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "3D CNN; 3D convolutional network; CNN; complicated
                 internal relations; Computational modeling;
                 convolution; convolutional neural network; Correlation;
                 end-to-end language processing structure; Feature
                 extraction; feature extraction; features extraction;
                 feedforward neural nets; image processing; language
                 processing; length sections; natural language
                 processing; object detection; pattern classification;
                 pooling processing; Recurrent neural networks; relation
                 classification; Relation Classification; SemEval-2010
                 Task 8 dataset; Sentence Classification; sentence
                 length variety; sentence-level classification;
                 sentences vectors; spatial pyramid pooling mechanism;
                 SPP; SPP structure; Task analysis; text analysis;
                 textual data modeling; Three-dimensional displays",

  author =       "B. McFee and J. Salamon and J. P. Bello",
  title =        "Adaptive Pooling Operators for Weakly Labeled Sound
                 Event Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2180--2193",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "active sound sources; adaptive pooling operators;
                 audio recording; audio recordings; audio signal
                 processing; autopool; average-pooling; common pooling
                 operators; convolutional neural networks; Data models;
                 deep learning; dynamic annotations; Event detection;
                 feedforward neural nets; human annotators; learning
                 (artificial intelligence); machine learning; Machine
                 learning; max-pooling; MIL problems; min-pooling;
                 multiple instance learning; multiple instance learning
                 problem; Predictive models; SED applications; SED
                 methods; segment labeling; signal detection; Sound
                 event detection; sound source; Standards; static
                 prediction; strong annotations; supervised machine
                 learning problem; Task analysis; temporally dynamic
                 predictions; time-series label prediction; Training;
                 training labels; weakly labeled sound event detection",

  author =       "I. Barbancho and G. Tzanetakis and A. M. Barbancho and
                 L. J. Tard{\'o}n",
  title =        "Discrimination Between Ascending\slash Descending
                 Pitch Arpeggios",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2194--2203",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal analysis; acoustic signal processing;
                 arpeggiated chord; ascending pitch arpeggios; audio
                 signal processing; automatic music transcription;
                 Automatic music transcription; cepstral analysis;
                 classification; descending pitch arpeggios;
                 expressiveness; feature extraction; features; Fisher
                 linear discriminant classification scheme; high-pitched
                 note; Instruments; Market research; Mel frequency
                 cepstral coefficient; Mel-frequency cepstral
                 coefficients; MFCC; music; Music; music information
                 retrieval (MIR); musical instruments; pitch direction;
                 playing technique; signal classification; Spectrogram;
                 spectrogram; Speech processing; stroke and arpeggio
                 analysis; support vector machines; SVM linear
                 classification scheme; Task analysis",

  author =       "Y. Kim and M. Kim and J. Goo and H. Kim",
  title =        "Learning Self-Informed Feature Contribution for Deep
                 Learning-Based Acoustic Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2204--2214",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic model network; Acoustic modeling; acoustic
                 signal processing; Acoustics; Artificial neural
                 networks; auxiliary deep neural network; contribution
                 gate outputs; deep learning; deep learning-based
                 acoustic modeling; DNN; element-level discriminative
                 contributions; FCN; feature contribution network;
                 feature engineering approach; feature extraction;
                 Feature extraction; gated features; Hidden Markov
                 models; input feature contributions; learning
                 (artificial intelligence); Logic gates; neural nets;
                 regularization method; self-informed feature
                 contribution learning; short-term memory-based AMNs;
                 sigmoid-based contribution gates; speech recognition;
                 Speech recognition; TED-LIUM
                 release 1 corpus; Training",

  author =       "M. B. {\c{C}}{\"o}teli and O. Olgun and H.
                 Hac{\i}habibo{\u{g}}lu",
  title =        "Multiple Sound Source Localization With Steered
                 Response Power Density and Hierarchical Grid
                 Refinement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2215--2229",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic field; acoustic signal processing; array
                 signal processing; associated signal-adaptive search
                 method; compact spherical harmonic representation;
                 Computational efficiency; direction-of-arrival
                 estimation; Direction-of-arrival estimation; DOA
                 estimation;
                 Estimation; Harmonic analysis; hierarchical grid
                 refinement; Microphone arrays; microphone arrays;
                 multiple sound source localization; reverberation;
                 rigid spherical microphone arrays; sound field
                 analysis; Source localization; Speech processing;
                 steered response power; steered response power
                 density",

  author =       "J. Bao and Y. Gong and N. Duan and M. Zhou and T.
                 Zhao",
  title =        "Question Generation With Doubly Adversarial Nets",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2230--2239",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "adversarial procedures; artificial intelligence; Data
                 models; DC-Dis; domain-classification discriminator;
                 domain-general representations; DoubAN; doubly
                 adversarial nets; doubly-adversarial net; Gallium
                 nitride; generated questions; generated text-question
                 pairs; Generators; Knowledge discovery; learning
                 (artificial intelligence); natural language processing;
                 neural networks; novel neural question generation
                 approach; pattern classification; QA-Dis; Question
                 generation; question generator; question-answering
                 discriminator; sequence-to-sequence learning; source
                 domains; source-domain labeled data; specific domain;
                 target domain; target-domain unlabeled data; Task
                 analysis; text analysis; Training; training data;
                 Training data; unsupervised learning",

  author =       "B. Bu and C. Bao and M. Jia",
  title =        "Design of a Planar First-Order Loudspeaker Array for
                 Global Active Noise Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2240--2250",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; acoustic transducer
                 arrays; Acoustics; active noise control; Active noise
                 control; Attenuation; general first-order sources;
                 general variable first-order responses; global active
                 noise control; Harmonic analysis; Loudspeakers;
                 loudspeakers; monopole component; noise abatement;
                 Planar arrays; planar first-order loudspeaker array
                 structure; planar loudspeaker array; planar loudspeaker
                 arrays; primary noise field; sound field; sound
                 reproduction; Speech processing; spherical harmonics;
                 tangential dipole components; Three-dimensional
                 displays; traditional spherical loudspeaker array",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2251--2252",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "2253--2255",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "C3--C3",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "11",
  pages =        "C4--C4",
  month =        nov,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "C1--C1",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "C2--C2",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2251--2252",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents [Edics]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2253--2254",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "X. Wang and Z. Tu and M. Zhang",
  title =        "Incorporating Statistical Machine Translation Word
                 Knowledge Into Neural Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2255--2266",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Chinese-to-English translation; Decoding;
                 English-to-German translation tasks; hybrid
                 translation; Knowledge engineering; language
                 translation; Modeling; natural language processing;
                 Neural machine translation; neural machine translation;
                 neural nets; neural network; neural network based
                 classifier; Neural networks; NMT decoder; NMT decoding
                 information; NMT word generation probability;
                 probability; SMT word knowledge; SMT word
                 recommendations; Speech processing; statistical
                 analysis; Statistical learning; statistical machine
                 translation; Training; translation combination;
                 vocabulary; Vocabulary",

  author =       "Y. Zhao and M. Kuruvilla-Dugdale and M. Song",
  title =        "Structured Sparse Spectral Transforms and Structural
                 Measures for Voice Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2267--2276",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "12 speaker pairs; Distortion; Distortion measurement;
                 frequency warping; frequency-warping characteristic;
                 high-D data; high-dimensional STRAIGHT spectra;
                 Matrices; matrix decomposition; muffled speech; NMF;
                 nonnegative matrix factorization; objective measures;
                 overfit matrix; ROS; source-target speaker pair; Sparse
                 matrices; spectral distortion; Speech processing;
                 speech processing; structural measures; structure
                 preservation; structured sparse spectral transform;
                 structured sparse spectral transforms; temporal
                 covariance; Training; transform matrix; Transforms; VC
                 method; VC speech quality; voice conversion; Voice
                 conversion; voice similarity",

  author =       "H. Salehi and D. Suelzle and P. Folkeard and V.
                 Parsa",
  title =        "Learning-Based Reference-Free Speech Quality Measures
                 for Hearing Aid Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2277--2288",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; aid applications;
                 amalgamates perceptual linear prediction; Auditory
                 system; Band-pass filters; feature extraction; Feature
                 extraction; feature set; frequency-shaped reference
                 signal; full-reference HASQI performance; gammatone
                 filterbank energies; HA output; HA quality ratings; HA
                 recordings; hearing; hearing aid speech quality index;
                 hearing aids; Hearing aids; HL-impacted
                 gammatone auditory filterbank energies; HL-modified PLP
                 coefficients; IIR filters; learning (artificial
                 intelligence); loss modeling; Machine learning; machine
                 learning; machine learning concepts; medical signal
                 processing; objective measures; perceptual linear
                 prediction; predicted quality scores; properly
                 time-aligned; Quality assessment; reference-free HA
                 speech quality indices; reference-free quality
                 assessment; reference-free speech quality; regression
                 analysis; speech enhancement; speech intelligibility;
                 speech processing; Speech processing; speech quality;
                 Support vector machines; support vector machines;
                 support vector regression",

  author =       "G. Enzner and P. Th{\"u}ne",
  title =        "{Bayesian} {MMSE} Filtering of Noisy Speech by {SNR}
                 Marginalization With Global {PSD} Priors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2289--2304",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "a-posteriori SNR; additive noise; Bayes methods;
                 Bayesian estimation; Bayesian MMSE filtering; complex
                 speech spectral amplitudes; global distribution; global
                 PSD priors; global SNR value; joint posterior
                 distribution; latent speech power-spectral density;
                 latent speech PSD state; latent time-varying a-priori
                 SNR; latent Wiener filter; least mean squares methods;
                 local data likelihood; MMSE estimation framework; Noise
                 measurement; noisy speech; residual noise; Signal to
                 noise ratio; single-channel speech enhancement; SNR
                 marginalization; spectral analysis; speech enhancement;
                 Speech enhancement; speech quality; speech-in-noise
                 condition; speech-PSD posterior; stationary Wiener
                 filters; statistical analysis; statistical estimators;
                 Time-frequency analysis; Wiener filters",

  author =       "G. Huang and J. Chen and J. Benesty",
  title =        "Insights Into Frequency-Invariant Beamforming With
                 Concentric Circular Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2305--2318",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "array signal processing; Array signal processing;
                 CCMA; circular microphone arrays; concentric circular
                 microphone arrays; deep nulls problem; directivity
                 factor; fixed and differential beamforming;
                 frequency-invariant beamforming; frequency-invariant
                 beampattern; Jacobi-Anger expansion; Jacobian matrices;
                 Microphone arrays; microphone arrays; Nth-order
                 symmetric beampatterns; Sensor
                 arrays; Speech processing; white noise gain",

  author =       "{Ayana} and S. Shen and Y. Chen and C. Yang and Z. Liu
                 and M. Sun",
  title =        "Zero-Shot Cross-Lingual Neural Headline Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2319--2327",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "cross-lingual headline generation; Data models; direct
                 source language articles; direct source-to-target CNHG
                 model; English-Chinese headline generation evaluation
                 datasets; headline generation; language translation;
                 monolingual headline generation; natural language
                 processing; Neural network; Neural networks; NHG
                 systems; parameterized CNHG model; source document;
                 Speech processing; summarization phases; target
                 language headlines; text analysis; Training; Training
                 data; zero-shot cross-lingual neural headline
                 generation; zero-shot scenario",

  author =       "S. Surendran and T. K. Kumar",
  title =        "Oblique Projection and Cepstral Subtraction in Signal
                 Subspace Speech Enhancement for Colored Noise
                 Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2328--2340",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "additive noise subspace; cepstral domain; cepstral
                 subtraction; clean speech signal; Colored noise;
                 colored noise reduction; colored noise removal;
                 Covariance matrices; Distortion; Masking property;
                 matrix algebra; Noise measurement; noisy speech
                 subspace; oblique projection; orthogonal noise
                 subspace; residual noise; signal subspace approach;
                 signal subspace speech enhancement; spectral domain
                 constrained estimator; Speech enhancement; speech
                 enhancement; speech enhancement methods; subspace
                 speech enhancement method; variance normalization",

  author =       "Q. Li and D. F. Wong and L. S. Chao and M. Zhu and T.
                 Xiao and J. Zhu and M. Zhang",
  title =        "Linguistic Knowledge-Aware Neural Machine
                 Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2341--2354",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Attention gate; Decoding; Encoding; encoding;
                 knowledge block; knowledge gate; knowledge-aware NMT
                 approach; language translation; linguistic
                 knowledge-aware neural machine translation;
                 Linguistics; linguistics; natural language processing;
                 neural machine translation (NMT); NMT encoder;
                 recurrent neural nets; recurrent neural network;
                 Recurrent neural networks; RNN encoder; Speech
                 processing; syntactic information; Syntactics; word
                 embeddings; word representation",

  author =       "W. Zhang and C. Hofmann and M. Buerger and T. D.
                 Abhayapala and W. Kellermann",
  title =        "Spatial Noise-Field Control With Online Secondary Path
                 Modeling: a Wave-Domain Approach",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2355--2370",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; active noise control;
                 Active noise control; Active noise reduction; Adaptive
                 algorithms; adaptive feedback control; adaptive
                 processing; feedback; feedback system; least mean
                 squares methods; loudspeakers; Loudspeakers; low-level
                 auxiliary noise; microphone array placement; microphone
                 arrays; Microphone arrays; multichannel active noise
                 control; multichannel ANC; nonconcentric circular
                 loudspeakers; online secondary path modeling; secondary
                 path modelling; Sensors; spatial noise-field control;
                 strong interchannel interference; tonal noise;
                 Transforms; wave domain; wave-domain adaptation
                 algorithm; wave-domain secondary path model",

  author =       "A. Meynard and B. Torr{\'e}sani",
  title =        "Spectral Analysis for Nonstationary Audio",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2371--2380",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Amplitude modulation; approximate maximum-likelihood
                 approach; audio signal processing; deformation; Doppler
                 effect; Gaussian processes; Gaussian stationary random
                 signals; local spectrum; maximum likelihood estimation;
                 nonstationary audio signals; Nonstationary signals;
                 spectral analysis; Speech processing;
                 stationarity-breaking operators; time warping; wavelet
                 analysis; Wavelet analysis; wavelet transform domain;
                 wavelet transforms; Wavelet transforms",

  author =       "I. Mart{\'\i}n-Morat{\'o} and M. Cobos and F. J.
                 Ferri",
  title =        "Adaptive Mid-Term Representations for Robust Audio
                 Event Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2381--2392",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic event detection; adaptive mid-term
                 representations; alternative event representation;
                 audio analysis tasks; Audio event classification; audio
                 scene classification; audio signal processing; audio
                 signals; distance-based texture windows; Event
                 detection; event segmentation stage; feature
                 extraction; Feature extraction; feature space;
                 fixed-length feature vectors; fixed-length
                 representation; Hidden Markov models; image
                 classification; image segmentation; image texture;
                 improved statistical description; low-level audio
                 features; mid-term segments; mid-term statistics;
                 nonlinear time normalization; robust audio event
                 classification; robust mid-term statistical
                 description; Robustness; sampling methods; short-term
                 features; short-term temporal framing; Statistics;
                 support vector machines; Support vector machines;
                 temporal evolution; temporal information; temporal
                 variability; trace-segmentation; uniform distance
                 subsampling; variable length; vectors",

  author =       "G. Firtha and P. Fiala and F. Schultz and S. Spors",
  title =        "On the General Relation of Wave Field Synthesis and
                 Spectral Division Method for Linear Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2393--2403",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic arrays; acoustic signal processing;
                 appropriate boundary integral representation; arbitrary
                 target sound field reproduction; arbitrary virtual
                 sound field; densely spaced loudspeaker ensemble;
                 explicit analytic method; explicit solution aims;
                 extended listening area; Geometry; Green's function
                 methods; high-frequency approximation; implicit
                 analytic method; integral equation; Integral equations;
                 integral equations; linear arrays; loudspeakers;
                 Receivers; required loudspeaker driving functions;
                 sound field synthesis; sound reproduction; spectral
                 division method; spectral integral; Speech processing;
                 target field specific synthesis scenarios;
                 Three-dimensional displays; Two dimensional displays;
                 Wave field synthesis; wave field synthesis",

  author =       "P. Birkholz and S. Stone and K. Wolf and D.
                 Plettemeier",
  title =        "Non-Invasive Silent Phoneme Recognition Using
                 Microwave Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2404--2411",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Antenna measurements; audible speech; electromagnetic
                 transmission spectra; frequency 2.0 GHz to 12.0 GHz;
                 k-nearest neighbors; linear discriminant analysis;
                 microwave detectors; microwave signals; multiple
                 phonetic contexts; nearest neighbour methods;
                 noninvasive silent phoneme recognition; Radar antennas;
                 Sensors; Silent-speech interface; silent-speech
                 interfaces; silent-speech technology; Speech
                 processing; Speech recognition; speech recognition;
                 Speech synthesis; Vivaldi antennas",

  author =       "W. Lin and M. Mak and J. Chien",
  title =        "Multisource {I}-Vectors Domain Adaptation Using
                 Maximum Mean Discrepancy Based Autoencoders",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2412--2422",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Adaptation models; Covariance matrices; data
                 distributions; domain adaptation; domain-invariant
                 autoencoder; domainwise MMD; generalized MMD;
                 i-vectors; i-vectors domain adaptation; learning
                 (artificial intelligence); Machine learning; machine
                 learning tasks; maximum mean discrepancy; maximum mean
                 discrepancy based autoencoders; MMD-based autoencoders;
                 multisource i-vector adaptation; multisource mismatch;
                 NIST; probability distributions; Robustness; speaker
                 recognition; Speaker verification; speaker verification
                 systems; speech coding; Speech processing; statistical
                 distributions; Training; Training data; vectors",

  author =       "M. Abdelwahab and C. Busso",
  title =        "Domain Adversarial for Acoustic Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2423--2435",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic emotion recognition; acoustic signal
                 processing; adversarial multitask training; adversarial
                 training; data annotation; data distributions; Data
                 models; data representations; deep neural network;
                 domain adversarial; domain classifier; emotion
                 recognition; Emotion recognition; emotion recognition
                 performance; emotional classifiers; emotional
                 dimensions; emotional-attribute-based descriptor
                 prediction; gradient methods; gradient reversal layer;
                 image classification; image representation; learning
                 (artificial intelligence); neural nets; performance
                 gap; shallow neural network; source domain; Speech
                 emotion recognition; speech emotion recognition; Speech
                 processing; speech recognition; Speech recognition;
                 target domain representations; test domains; Testing;
                 testing data; testing performance; Training; unlabeled
                 adaptation of acoustic emotional models; unlabeled",

  author =       "D. {El Badawy} and I. Dokmani{\'c}",
  title =        "Direction of Arrival With One Microphone, a Few
                 {LEGOs}, and Non-Negative Matrix Factorization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2436--2446",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; ad hoc scatterers;
                 arbitrary scattering structure; direction of arrival
                 estimation; direction-dependent way;
                 direction-of-arrival estimation; Direction-of-arrival
                 estimation; frequency response; group sparsity; inverse
                 problem; inverse problems; learned nonnegative
                 dictionaries; learning (artificial intelligence); LEGO
                 bricks; localizing speech; matrix decomposition;
                 Microphones; microphones; monaural localization;
                 monaural speech localization algorithm; multisource
                 localization; non-negative matrix factorization;
                 nonnegative dictionaries; nonnegative matrix
                 factorization; rudimentary structures; Scattering;
                 single microphone; sound scattering; sound source
                 localization; Speech processing; speech processing;
                 unilateral hearing loss; universal speech model; white
                 noise; White noise; white noise",

  author =       "H. Lee and P. Chung and Y. Wu and T. Lin and T. Wen",
  title =        "Interactive Spoken Content Retrieval by Deep
                 Reinforcement Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2447--2459",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "content-based retrieval; deep reinforcement learning;
                 deep-Q-learning; deep-Q-network; DQN; Feature
                 extraction; hand-crafted states; interactive spoken
                 content retrieval; interactive systems; Learning
                 (artificial intelligence); learning (artificial
                 intelligence); machine actions; Machine learning;
                 Multimedia communication; reinforcement learning;
                 Reinforcement learning; retrieval results; retrieved
                 items; Speech processing; speech recognition; Speech
                 recognition; Spoken content retrieval; text content
                 retrieval; User interfaces; user-machine interaction",

  author =       "S. Elshamy and N. Madhu and W. Tirry and T.
                 Fingscheidt",
  title =        "{DNN}-Supported Speech Enhancement With Cepstral
                 Estimation of Both Excitation and Envelope",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2460--2474",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "a priori SNR; a priori SNR estimation; CEM technique;
                 Cepstral analysis; cepstral domain; cepstral excitation
                 manipulation technique; classical MMSE short time
                 spectral amplitude estimator; clean
                 envelope-representing coefficients; clean spectral
                 envelopes; Deep learning; deep neural network approach;
                 DNN-supported speech enhancement; filtering theory;
                 hidden Markov model; Hidden Markov models; hidden
                 Markov models; human speech production; least mean
                 squares methods; neural nets; noise attenuation; Noise
                 reduction; noise reduction framework; noisy conditions;
                 Signal to noise ratio; source-filter
                 model; spectral analysis; speech component; Speech
                 enhancement; speech enhancement; speech spectral
                 envelope-based noise reduction",

  author =       "Y. Bao and H. Chen",
  title =        "A Chance-Constrained Programming Approach to the
                 Design of Robust Broadband Beamformers With Microphone
                 Mismatches",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2475--2488",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "array response distortion distribution property; array
                 signal processing; Broadband beamformers; Broadband
                 communication; CCP-based design problem; chance
                 constraint probability; chance-constrained programming;
                 chance-constrained programming based design approach;
                 chance-constrained stopband level constraint;
                 computational complexity; convex programming;
                 Distortion; Microphone arrays; microphone arrays;
                 microphone mismatches; NP-hard problem; Optimization;
                 overconservatism problem; Passband; probability;
                 relaxed convex optimization formulation; robust
                 broadband beamformers; robustness; Robustness;
                 WMPO-based design approaches; worst case mean
                 performance optimization; worst-case mean performance
                 optimization",

  author =       "Anonymous",
  title =        "Farewell Editorial",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2489--2489",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "List of Reviewers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2490--2496",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "IEEE publishing",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} Edics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2497--2498",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2499--2501",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE} Open Access Publishing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2502--2502",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "2018 Index {{\booktitle{IEEE\slash ACM Transactions on
                 Audio, Speech, and Language Processing}}} Vol. 26",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "2503--2528",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "C3--C3",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "26",
  number =       "12",
  pages =        "C4--C4",
  month =        dec,
  year =         "2018",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "C1--1",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "C2--C2",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents [Edics]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "2--3",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "[{Blank} page]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "B4--B4",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Inaugural Editorial Innovations in an Era of
                 Ubiquitous Audio, Speech, and Language Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "5--6",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "F. Bao and W. H. Abdulla",
  title =        "A New Ratio Mask Representation for {CASA}-Based
                 Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "7--19",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "binary mask; CASA-based speech enhancement; channel
                 bank filters; channel-weight contour; Computational
                 auditory scene analysis (CASA); Correlation; deep
                 neural networks (DNN); equal loudness hearing
                 attribute; five-layer structured deep neural network;
                 Gammatone filterbank channel; hearing; ICC; ideal ratio
                 mask (IRM); inter-channel correlation; neural nets;
                 Noise measurement; noise ratio conditions; ratio mask;
                 ratio mask representation; revised ratio mask; Signal
                 to noise ratio; source separation; spectral distortion;
                 speech enhancement; Speech enhancement; speech
                 enhancement; speech processing; speech quality;
                 speech-noise power ratio; Standards; Training; Wiener
                 filtering; Wiener filters",

  author =       "P. Magron and T. Virtanen",
  title =        "Complex {ISNMF}: a Phase-Aware Model for Monaural
                 Audio Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "20--31",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Adaptation models; anisotropic Gaussian model; audio
                 signal processing; audio source separation; Bayes
                 methods; Bayesian anisotropic Gaussian source model;
                 Bayesian inference; circularly-symmetric Gaussian;
                 complex ISNMF; complex Itakura-Saito NMF; complex NMF;
                 Estimation; expectation-maximisation algorithm; Fourier
                 transforms; Gaussian distribution; Gaussian processes;
                 Itakura Saito divergence; Markov chain prior structure;
                 matrix decomposition; monaural audio source separation;
                 musical source separation task; nonisotropic variables;
                 nonnegative matrix factorization; Nonnegative matrix
                 factorization (NMF); phase constraints; phase recovery;
                 phase-aware model; phase-aware probabilistic model;
                 probability; Random variables; short-time Fourier
                 transform domain; signal model; source separation;
                 Source separation; Speech processing; state-of-the-art
                 phase-aware separation techniques",

  author =       "T. T. H. Duong and N. Q. K. Duong and P. C. Nguyen and
                 C. Q. Nguyen",
  title =        "{Gaussian} Modeling-Based Multichannel Audio Source
                 Separation Exploiting Generic Source Spectral Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "32--43",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "audio signal processing; blind audio source
                 separation; blind source separation; covariance
                 analysis; Covariance matrices; Electronic mail;
                 expectation-maximisation algorithm; Frequency-domain
                 analysis; Gaussian modeling-based multichannel audio
                 source Separation; Gaussian processes; generalized
                 expectation-minimization algorithm; generic source
                 spectral model; generic spectral model; group sparsity
                 constraint; intermediate source variances; local
                 Gaussian model; matrix decomposition; Microphones;
                 Multichannel audio source separation; multichannel
                 source separation approach; NMF; nonnegative matrix
                 factorization; Parameter estimation; parameter
                 estimation; signal denoising; single-channel audio
                 mixtures; Source separation; source spatial covariance
                 model; source variance denoising; Speech processing;
                 speech processing; unified Gaussian modeling",

  author =       "G. Zhang and J. Tao and X. Qiu and I. Burnett",
  title =        "Decentralized Two-Channel Active Noise Control for
                 Single Frequency by Shaping Matrix Eigenvalues",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "44--52",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "active noise control; Active noise control (ANC);
                 active noise control system; adaptive controller;
                 centralized approaches; centralized controller;
                 Computational complexity; computational complexity;
                 Convergence; Decentralized control; decentralized
                 control scheme; decentralized controller; decentralized
                 two-channel active noise control; Eigenvalues and
                 eigenfunctions; eigenvalues and eigenfunctions; error
                 microphone; error microphones; frequency domain; matrix
                 algebra; matrix eigenvalues; Microphones; microphones;
                 multiple secondary sources; noise disturbance; Noise
                 reduction; noise reduction performance; Process
                 control; small-size ANC subsystems; two-channel ANC
                 system; two-channel secondary paths",

  author =       "Y. Zhao and Z. Wang and D. Wang",
  title =        "Two-Stage Deep Learning for Noisy-Reverberant Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "53--62",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "automatic speech; background noise; deep neural
                 networks; Deep neural networks; denoising;
                 dereverberation; ideal ratio mask; iterative methods;
                 iterative phase reconstruction; learning (artificial
                 intelligence); Linear programming; neural nets; Noise
                 measurement; Noise reduction; noisy-reverberant speech
                 enhancement; objective function; one-stage enhancement
                 systems; phase; phase estimates; reverberation;
                 Reverberation; room reverberation; signal
                 reconstruction; speaker recognition; spectral
                 magnitudes estimation; speech denoising; speech
                 dereverberation; Speech enhancement; speech
                 enhancement; speech intelligibility; speech quality;
                 Time-domain analysis; Training; two-stage deep
                 learning; two-stage model",

  author =       "N. Zheng and X. Zhang",
  title =        "Phase-Aware Speech Enhancement Based on Deep Neural
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "63--76",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "corresponding magnitude spectrogram; Deep neural
                 network (DNN); deep neural networks; DNN-based methods;
                 Fourier transforms; harmonic model; incorporating
                 phase; instantaneous frequency; instantaneous frequency
                 deviation; learning (artificial intelligence); neural
                 nets; Noise measurement; phase estimation; phase
                 processing; phase-aware speech enhancement algorithm;
                 radio applications; short-time frequency; Spectrogram;
                 speech enhancement; Speech enhancement; speech
                 enhancement; speech recognition; speech-processing
                 algorithms; STFT magnitude; telecommunication;
                 Time-frequency analysis; time-frequency analysis;
                 Training; unstructured phase spectrogram; unstructured
                 STFT phase; Wrapping",

  author =       "T. Moriya and T. Tanaka and T. Shinozaki and S.
                 Watanabe and K. Duh",
  title =        "Evolution-Strategy-Based Automation of System
                 Development for High-Performance Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "77--88",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "cloud computers; cloud computing; covariance matrix
                 adaptation evolution strategy (CMA-ES); deep neural
                 network; deep neural network (DNN);
                 evolution-strategy-based automation; evolutionary
                 computation; genetic algorithm; Genetic algorithms;
                 hidden Markov model; hidden Markov models; Hidden
                 Markov models; high-performance speech recognition;
                 large vocabulary speech recognition system;
                 meta-parameters; multi-objective optimization;
                 multiobjective Pareto optimization; neural nets;
                 Optimization; parallel computation; parallel
                 processing; Pareto optimisation; Speech processing;
                 Speech recognition; speech recognition; system
                 development; Training; Vocabulary; word error rate",

  author =       "H. Kamper and G. Shakhnarovich and K. Livescu",
  title =        "Semantic Speech Retrieval With a Visually Grounded
                 Model of Untranscribed Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "89--98",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Analytical models; automatic speech recognition; Data
                 models; external image tagger; human semantic relevance
                 judgements; information retrieval; keyword spotting;
                 learning (artificial intelligence); multimodal
                 modelling; natural language processing; neural model;
                 neural nets; nonverbatim semantic matches; parallel
                 speech; Predictive models; semantic retrieval; semantic
                 speech retrieval; Semantics; speech processing; Speech
                 processing; speech recognition; speech retrieval; Task
                 analysis; unlabelled speech; untranscribed speech;
                 visual context; Visual grounding; Visualization;
                 visually grounded speech model",

  author =       "M. S. Kavalekalam and J. K. Nielsen and J. B. Boldt
                 and M. G. Christensen",
  title =        "Model-Based Speech Enhancement for Intelligibility
                 Improvement in Binaural Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "99--113",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic scenarios representative; acoustic signal
                 processing; autoregressive model; binaural
                 codebook-based method; binaural enhancement; binaural
                 hearing aids; binaural speech enhancement framework;
                 clean speech pitch parameters; cocktail party scenario;
                 directional pitch estimator; Ear; enhancement process;
                 Estimation; filter parameters; harmonic model; hearing
                 aid technology; hearing aids; hearing impaired
                 individuals; intelligibility improvement; Kalman
                 filter; Kalman filters; Mathematical model; maximum
                 likelihood estimation; maximum likelihood principle;
                 model-based speech enhancement; Noise measurement;
                 normal hearing subjects; pitch estimation; pitch
                 parameters; robust estimation; Speech enhancement;
                 speech enhancement; speech intelligibility; speech
                 production dynamics; speech production model; speech
                 quality; STP parameters",

  author =       "A. R. MV and P. K. Ghosh",
  title =        "Glottal Inverse Filtering Using Probabilistic Weighted
                 Linear Prediction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "114--124",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "all-pole filter; Computational modeling; Data models;
                 filter coefficients; filtering theory; Gibbs sampling;
                 GIF; glottal closure; glottal cycle; glottal flow
                 estimate; glottal inverse filtering; Glottal inverse
                 filtering; Indexes; Liljencrants-Fant model; Lips;
                 physical model; probabilistic interpretation;
                 Probabilistic logic; probabilistic temporal weighting;
                 probabilistic weighted linear prediction; probability;
                 Random variables; speech data; speech processing;
                 Speech processing; synthetic data",

  author =       "Y. Sun and W. Wang and J. Chambers and S. M. Naqvi",
  title =        "Two-Stage Monaural Source Separation in Reverberant
                 Room Environments Using Deep Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "125--139",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic signal processing; current state-of-the-art
                 methods; deep neural networks; Deep neural networks;
                 dereverberant speech mixture; dereverberation mask; DM;
                 DNN-based method; highly reverberant room environments;
                 ideal enhanced mask; ideal ratio mask; IEM;
                 Interference; IRM; monaural source separation; monaural
                 source separation problem; neural nets; Neural
                 networks; Noise measurement; NOISEX dataset;
                 reverberant room environments; reverberation;
                 Reverberation; room impulse responses; single DNN;
                 source separation; Source separation; speech
                 intelligibility; speech mixture dereverberation; speech
                 processing; Speech processing; TIMIT corpora; Training;
                 transient response; two-stage approach; two-stage
                 monaural source separation",

  author =       "L. Ferrer and M. K. Nandwana and M. McLaren and D.
                 Castan and A. Lawson",
  title =        "Toward Fail-Safe Speaker Recognition: Trial-Based
                 Calibration With a Reject Option",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "140--153",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Bayes methods; calibration; Calibration; calibration
                 loss; calibration step; candidate training;
                 Computational modeling; Data models; evaluation
                 conditions; forensic voice comparison; Forensics;
                 Gaussian processes; learning (artificial intelligence);
                 Logistics; matched calibration data; matched data;
                 reject option; relevant calibration data; separate
                 calibration model; Speaker recognition; speaker
                 recognition; speaker recognition systems; standard
                 calibration approach; TBC method; toward fail-safe
                 speaker recognition; Training; training data;
                 trial-based calibration",

  author =       "J. Amini and R. C. Hendriks and R. Heusdens and M. Guo
                 and J. Jensen",
  title =        "Asymmetric Coding for Rate-Constrained Noise Reduction
                 in Binaural Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "154--167",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "advanced noise reduction algorithms; Array signal
                 processing; asymmetric coding; asymmetric sequential
                 coding scheme; binaural hearing aids; Binaural hearing
                 aids (HAs); complete joint noisy signal statistics;
                 hearing aids; information bit-rate; mean square error
                 distortion measure; mean square error methods; medical
                 signal processing; microphones; Microphones; monaural
                 beamforming; monaural-bilateral HA; multi-microphone
                 noise reduction; Noise measurement; Noise reduction;
                 optimal rate-constrained beamforming strategy;
                 Quantization (signal); rate-constrained noise
                 reduction; remote source coding; sequential codes;
                 signal denoising; Source coding; speech coding;
                 sub-optimal rate; sub-optimal strategies; transmission",

  author =       "J. Yu and J. Jiang and R. Xia",
  title =        "Global Inference for Aspect and Opinion Terms
                 Co-Extraction Based on Multi-Task Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "168--177",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "aspect term extraction; aspect terms; Benchmark
                 testing; data mining; global inference approach; global
                 inference method; inference mechanisms; inter-task
                 relationship; Labeling; learning (artificial
                 intelligence); multitask learning framework; multitask
                 neural networks; Natural language processing; neural
                 nets; neural network architectures; Neural networks;
                 neural networks; neural predictions; opinion mining;
                 opinion term extraction; opinion terms co-extraction;
                 Sentiment analysis; sentiment analysis; Standards;
                 syntactic constraints; syntactic relations; Syntactics;
                 Task analysis",

  author =       "Z. Wang and X. Zhang and D. Wang",
  title =        "Robust Speaker Localization Guided by Deep
                 Learning-Based Time-Frequency Masking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "178--188",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic noise; acoustic signal processing; audio
                 signal processing; conventional localization
                 algorithms; deep learning-based time-frequency masking;
                 deep neural networks; Delay effects; direction of
                 arrival estimation; Direction-of-arrival estimation;
                 direction-of-arrival estimation; Estimation; GCC-PHAT;
                 generalized cross correlation; ideal ratio mask;
                 intense noise; learning (artificial intelligence);
                 Microphones; microphones; monaural spectral
                 information; monaural speech enhancement; monaural
                 speech separation; neural nets; noisy environments;
                 reverberant environments; Reverberation; robust speaker
                 localization; room reverberation; Signal processing
                 algorithms; Signal to noise ratio; single-channel;
                 speech dominant T-F units; speech processing;
                 steered-response power; steering vectors;
                 time-frequency analysis; time-frequency masking;
                 traditional DOA estimation methods; trained model",

  author =       "K. Tan and J. Chen and D. Wang",
  title =        "Gated Residual Networks With Dilated Convolutions for
                 Monaural Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "189--198",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "bidirectional LSTM model; CNN model; contextual
                 information; Convolution; convolutional neural network
                 architecture; deep neural networks; dilated
                 convolutions; Dilated convolutions; feedforward neural
                 nets; gated linear units; gated residual networks;
                 gating mechanisms; generalisation (artificial
                 intelligence); learning (artificial intelligence);
                 Logic gates; long-term contexts; mask estimation;
                 monaural speech enhancement; Noise measurement;
                 objective speech intelligibility; quality metrics;
                 recurrent neural nets; residual learning;
                 sequence-to-sequence mapping; Signal to noise ratio;
                 spectral mapping; speech enhancement; Speech
                 enhancement; speech enhancement; speech
                 intelligibility; supervised speech enhancement;
                 systematic context aggregation; target speaker
                 tracking; temporal contexts; Training; unidirectional
                 long short-term memory; unidirectional LSTM model",

  author =       "G. H. Ngo and M. Nguyen and N. F. Chen",
  title =        "Phonology-Augmented Statistical Framework for Machine
                 Transliteration Using Limited Linguistic Resources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "199--211",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "consonant cluster; cross-lingual information
                 retrieval; Data models; foreign word; language
                 translation; linguistic resources; linguistics; machine
                 translation; machine transliteration; named entity
                 recognition; natural language processing; Phonetics;
                 phonological structure; phonology-augmented statistical
                 framework; source language; Speech processing;
                 Standards; statistical analysis; statistical
                 transliteration approaches; target languages phonology;
                 Task analysis; Training; Training data;
                 Transliteration; transliteration system",

  author =       "Y. Koizumi and S. Saito and H. Uematsu and Y. Kawachi
                 and N. Harada",
  title =        "Unsupervised Detection of Anomalous Sound Based on
                 Deep Learning and the {Neyman--Pearson} Lemma",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "212--224",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic signal detection; autoencoder; anomalous
                 sound; Anomaly detection in sound; anomaly score; deep
                 learning; Feature extraction; learning (artificial
                 intelligence); Linear programming; Neyman-Pearson
                 lemma; optimisation; Probability density function;
                 reconstruction error; sampling methods; security of
                 data; simulate anomalous sounds; Speech processing;
                 statistical analysis; Task analysis; Training data;
                 true positive rate; unknown anomalous sounds;
                 unsupervised anomaly detection; unsupervised detection;
                 unsupervised learning; unsupervised-ADS",

  author =       "Y. Laufer and S. Gannot",
  title =        "A {Bayesian} Hierarchical Model for Speech Enhancement
                 With Time-Varying Audio Channel",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "225--239",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic channel; Acoustics; Adaptive beamforming;
                 array signal processing; audio signal processing; Bayes
                 methods; Bayesian hierarchical model; channel
                 alignment; channel estimate; Covariance matrices;
                 expectation-maximisation algorithm; filtering theory;
                 fully Bayesian hierarchical approach; Gaussian
                 processes; Heuristic algorithms; Kalman filters; Kalman
                 smoother; Microphones; multichannel linear-Gaussian
                 state-space model; multichannel minimum variance
                 distortionless response beamformer; multichannel speech
                 enhancement; multichannel Wiener filter; MVDR
                 beamformer; noise precision matrix; noisy signal;
                 probabilistic approach; probability; reverberation;
                 reverberation levels; single-channel variational
                 postfilter; Speech enhancement; speech enhancement;
                 speech precision; speech quality; speech signal;
                 time-varying audio channel; tracking ability;
                 variational EM; variational expectation-maximization
                 algorithm; VEM speech estimator; Wiener filters",

  author =       "Anonymous",
  title =        "Erratum for Nonlinear Audio Systems Identification
                 Through Audio Input {Gaussianization}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "240--240",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Audio systems; Nonlinear systems; Speech processing",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "1",
  pages =        "C3--C3",
  month =        jan,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "C1--241",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "C2--C2",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",

  author =       "Anonymous",
  title =        "Table of {Contents[Edics]}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "242--243",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",

  author =       "T. Nakashika and S. Takaki and J. Yamagishi",
  title =        "Complex-Valued Restricted {Boltzmann} Machine for
                 Speaker-Dependent Speech Parameterization From Complex
                 Spectra",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "244--254",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Boltzmann machines; cepstral analysis; complex-valued
                 data; complex-valued representation; complex-valued
                 restricted Boltzmann machine; complex-valued spectra;
                 contrastive divergence; CRBM; deep learning; Feature
                 extraction; feature extraction; Gibbs sampling; hidden
                 Markov models; learning (artificial intelligence); Mel
                 frequency cepstral coefficient; Restricted Boltzmann
                 machine; signal classification; speaker-dependent
                 speech parameterization; speech processing; Speech
                 processing; Speech recognition; speech recognition;
                 speech signal processing; speech synthesis; Task
                 analysis",

  author =       "F. Xiong and S. Goetze and B. Kollmeier and B. T.
                 Meyer",
  title =        "Joint Estimation of Reverberation Time and
                 Early-To-Late Reverberation Ratio From Single-Channel
                 Speech Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "255--267",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic characterization; acoustic observations;
                 acoustic room environment characterization; acoustic
                 signal processing; architectural acoustics; artificial
                 neural network; auditory-inspired acoustic features;
                 blind estimation methods; early-to-late reverberation
                 ratio; ELR classes; ELR estimation; ELR simultaneously;
                 Estimation; extreme reverberant conditions; Feature
                 extraction; joint estimation; joint room parameter
                 estimator; learning (artificial intelligence);
                 Modulation; multi-task learning; multitask learning;
                 neural nets; noisy environments; parameter estimation;
                 Reverberation; reverberation; Reverberation time;
                 reverberation time; signal representation;
                 single-channel speech signals; single-task ROPE system;
                 speech processing; Speech processing; speech
                 time-frequency representations; statistical
                 distributions; sub-band frequency data; subband
                 signals; temporal modulation features; temporal
                 modulation filtering; Time-frequency analysis",

  author =       "F. St{\"o}ter and S. Chakrabarty and B. Edler and E.
                 A. P. Habets",
  title =        "{CountNet}: Estimating the Number of Concurrent
                 Speakers Using Supervised Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "268--282",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "audio surveillance; audio-based tasks; blind source
                 separation; cocktail-party; complementary aspects;
                 concurrent speakers; convolutional recurrent neural
                 networks; deep architectures; deep neural network
                 architectures; discrete point estimates; Estimation;
                 learning (artificial intelligence); maximum number;
                 Microphones; Neural networks; number of concurrent
                 speakers; output posterior distributions; overlap
                 detection; probability; recurrent neural nets;
                 single-channel mixtures; Speaker count estimation;
                 speaker count estimation; speaker diarization; speech
                 mixtures; speech processing; Speech processing;
                 supervised learning; Surveillance; Task analysis;
                 unifying probabilistic paradigm",

  author =       "M. Kolb{\ae}k and Z. Tan and J. Jensen",
  title =        "On the Relationship Between Short-Time Objective
                 Intelligibility and Short-Time Spectral-Amplitude
                 Mean-Square Error for Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "283--295",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Auditory system; Correlation; correlation theory; deep
                 neural network based speech enhancement algorithms;
                 deep neural networks; DNN training criterion; DNN-based
                 speech enhancement algorithms; envelope linear
                 correlation; improved speech intelligibility
                 performance; least mean squares methods; mean-square
                 error criterion; minimum mean-square error estimator;
                 neural nets; Noise measurement; noisy speech;
                 short-time objective intelligibility; short-time
                 spectral amplitudes; short-time spectral-amplitude;
                 Signal processing algorithms; Speech enhancement;
                 speech enhancement; Speech enhancement; speech
                 intelligibility; speech temporal envelopes; standard
                 STSA minimum-MSE estimator; state-of-the-art speech
                 intelligibility estimator; STOI speech intelligibility
                 estimator; STSA-MSE criterion; Time-frequency
                 analysis",

  author =       "M. W. Hansen and J. R. Jensen and M. G. Christensen",
  title =        "Estimation of Fundamental Frequencies in Stereophonic
                 Music Mixtures",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "296--310",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic signal processing; audio signal processing;
                 Delays; Estimation; expectation-maximisation algorithm;
                 Frequency estimation; fundamental frequency estimation;
                 Gaussian sources; harmonic amplitude vectors; Harmonic
                 analysis; harmonic mixture components; instrument
                 recordings; Instruments; least squares approximations;
                 mixing parameters; model selection; multi-channel pitch
                 estimation; Multi-pitch estimation; multipitch
                 estimation problem; Multiple signal classification;
                 music; music information retrieval; overlapping
                 harmonics; panning parameters; pitch estimation
                 problem; recording studio; signal model; Speech
                 processing; stereophonic music mixtures; stereophonic
                 signal analysis; vector quantization",

  author =       "J. Bao and D. Tang and N. Duan and Z. Yan and M. Zhou
                 and T. Zhao",
  title =        "Text Generation From Tables",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "311--320",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "artificial intelligence; BLEU-4 scores; continuous
                 vectors; Decoding; descriptive sentences;
                 Encyclopedias; flexible copying mechanism; language
                 model based approaches; natural language processing;
                 natural language sentence; Natural languages; neural
                 generative model; neural nets; neural network; Neural
                 networks; search engine; Search engines; selective
                 content replication; SIMPLEQUESTIONS dataset; Speech
                 processing; table attributes; table caption; table
                 cells; table semantics; table-query pairs;
                 Table-to-text generation; Table2Seq; Table2Seq model;
                 Task analysis; text analysis; text generation; WIKIBIO
                 dataset; WIKITABLETEXT dataset",

  author =       "A. I. Koutrouvelis and R. C. Hendriks and R. Heusdens
                 and J. Jensen",
  title =        "A Convex Approximation of the Relaxed Binaural
                 Beamforming Optimization Problem",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "321--331",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Acoustic distortion; acoustic signal processing;
                 acoustic sources; approximation theory; Array signal
                 processing; array signal processing; Binaural
                 beamforming; binaural cues; binaural-cue distortions;
                 binaural-cue preservation; computational complexity;
                 concave programming; convex approximation; Convex
                 functions; convex optimization; convex programming;
                 distortion; frequency bin; hybrid methods; LCMV; lower
                 computational complexity; multiple convex optimization
                 problems; Noise reduction; noise reduction; noise
                 suppression; nonconvex optimization problem;
                 Optimization; output noise power; predicted
                 intelligibility; RBB optimization problem; RBB problem;
                 relaxed binaural beamforming optimization problem; SCO
                 method; semi-definite relaxation; semidefinite convex
                 relaxation; single convex optimization problem;
                 suboptimal hybrid method; suboptimal method; suboptimal
                 SDCR method; successive convex optimization method;
                 Wiener filters",

  author =       "T. Hashimoto and D. Saito and N. Minematsu",
  title =        "Many-to-Many and Completely Parallel-Data-Free Voice
                 Conversion Based on Eigenspace {DNN}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "332--341",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Adaptation models; conversion model; Data models; deep
                 neural network; eigenspace DNN; eigenvalues and
                 eigenfunctions; eigenvoice; eigenvoice Gaussian mixture
                 models; Gaussian mixture model; Gaussian mixture
                 models; Gaussian processes; many-to-many conversion;
                 many-to-many voice conversion; mixture models; neural
                 nets; parallel processing; parallel-data-free;
                 parallel-data-free voice conversion; prestored parallel
                 data; pseudoparallel data; speaker features; speaker
                 recognition; speaker space; Speech processing; Task
                 analysis; Training; Voice conversion; voice conversion",

  author =       "F. Pishdadian and B. Pardo",
  title =        "Multi-Resolution Common Fate Transform",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "342--354",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "audio signal processing; audio signal representation;
                 Audio source separation; audio sources; CFT; channel
                 bank filters; clusterability; fully invertible complex
                 time-frequency representation; high time-frequency
                 overlap; MCFT domain yield; Microsoft Windows;
                 Modulation; multi-resolution common fate transform;
                 multiple audio signals; multiresolution common fate
                 transform; multiresolution property; multiresolution
                 two-dimensional filter bank; resolution issue;
                 separability; signal representation; signal resolution;
                 source separation; Source separation; source signals;
                 state-of-the-art representation; Time-frequency
                 analysis; time-frequency analysis; time-frequency
                 domain; time-frequency signal representations;
                 Transforms; Two dimensional displays",

  author =       "Y. Wu and W. Li",
  title =        "Automatic Audio Chord Recognition With {MIDI}-Trained
                 Deep Feature and {BLSTM-CRF} Sequence Decoding Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "355--366",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; audio signal processing;
                 automatic audio chord recognition; Automatic chord
                 recognition; automatic chord recognition tasks;
                 bidirectional long short-term memory (BLSTM);
                 bidirectional long short-term memory conditional random
                 field; BLSTM-CRF sequence decoding model; chord
                 classification; chord recognition systems; CNN feature
                 extractor; conditional random fields (CRF);
                 convolution; convolutional neural network; data-driven
                 feature extraction; Decoding; deep feature extractor;
                 feature extraction; Feature extraction; feedforward
                 neural nets; hand-annotating time-synchronized chord
                 labels; Harmonic analysis; Hidden Markov models;
                 learning (artificial intelligence); machine learning
                 technologies; MIDI-trained deep feature; Music; music;
                 musical instrument digital interface; random processes;
                 real-world music audio recordings; recurrent neural
                 nets; signal classification; Training",

  author =       "K. Imoto and N. Ono",
  title =        "Acoustic Topic Model for Scene Analysis With
                 Intermittently Missing Observations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "367--382",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic observations; acoustic scene analysis;
                 Acoustic scene analysis; acoustic scenes; acoustic
                 signal processing; acoustic topic model; acoustic word
                 corresponds; acoustic word transition; Acoustics;
                 Analytical models; Data models; hidden Markov models;
                 Hidden Markov models; Image analysis; Markov model;
                 missing data analysis; missing observations; multiple
                 acoustic words; Privacy; Speech processing",

  author =       "K. Xiao and S. Wang and M. Wan and L. Wu",
  title =        "Reconstruction of {Mandarin} Electrolaryngeal
                 Fricatives With Hybrid Noise Source",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "383--391",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "abnormal source location; Acoustic analysis; acoustic
                 signal processing; Acoustics; Attenuation; Cutoff
                 frequency; EL fricative reconstruction; EL source; EL
                 speech production; electrolarynx; fricative
                 reconstruction; hybrid noise source; intelligibility;
                 Mandarin electrolaryngeal fricatives; Mandarin
                 electrolaryngeal speech; Mandarin fricatives; Position
                 measurement; Production; signal denoising; signal
                 reconstruction; speech enhancement; speech
                 intelligibility; Speech processing; transfer functions;
                 voice source; Wideband; wideband noise source",

  author =       "L. Krishnan and T. Betlehem and P. D. Teal",
  title =        "Fast Algorithms for Acoustic Impulse Response
                 Shaping",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "392--403",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic impulse response shaping; acoustic signal
                 processing; Convergence; Dual Augmented Lagrangian
                 Method (DALM); fast algorithms; Fenchel conjugate;
                 Fenchel duality theorem; filtering theory; impulse
                 response shaping; Loudspeakers; Microphones;
                 microphones; Minimization; Reverberation;
                 reverberation; room acoustics; room compensation;
                 shaping algorithm; shaping filters; soft thresholding
                 function; Speech processing; transient response",

  author =       "V. Zakeri and A. J. Hodgson",
  title =        "Automatic Identification of Hard and Soft Bone Tissues
                 by Analyzing Drilling Sounds",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "404--414",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "biomedical ultrasonics; bone; bone drilling;
                 bone-drilling procedures; bone-out; bone-specific;
                 Bones; bovine tibial bones; Drilling machines; drilling
                 sound; Force; hard bone tissues; hidden Markov model;
                 hidden Markov models; logistic regression; machine
                 learning; Medical acoustics; medical signal processing;
                 random forest; regression analysis; soft bone tissues;
                 sound signals; Speech processing; support vector
                 machine; support vector machines; Support vector
                 machines; Surgery; surgery; surgical drill; tissue
                 identification; Tools; wavelet packet transform
                 coefficients; wavelet transforms",

  author =       "S. Bilbao and B. Hamilton",
  title =        "Directional Sources in Wave-Based Acoustic
                 Simulation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "415--428",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Acoustics; approximants; approximation theory;
                 arbitrary directivity; complete solution; detailed
                 modeling; directional character; directional sources;
                 finite difference time domain method; finite difference
                 time domain setting; finite difference time-domain
                 analysis; interpolation; Mathematical model; multipole
                 modeling; Numerical models; point sources; Propagation;
                 Room acoustics; Solid modeling; source modeling;
                 spatial Fourier-based approximation strategy; spatial
                 grid; spatio-temporal domain; Three-dimensional
                 displays; three-dimensional wave equation; Time-domain
                 analysis; underlying grid; volumetric wave-based
                 acoustic simulation; wave equations",

  author =       "Y. Zhang and B. Pardo and Z. Duan",
  title =        "{Siamese} Style Convolutional Neural Networks for
                 Sound Search by Vocal Imitation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "429--441",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "audio content; audio feature representations; audio
                 signal processing; convolution; Convolutional neural
                 networks; Databases; encoded features; environmental
                 sound classification; Feature extraction; feature
                 extraction; feedforward neural nets; fully connected
                 network; IMINET; imitation encoder; information
                 retrieval; learning (artificial intelligence); metric
                 learning; Neurons; original sound encoder; Poles and
                 towers; query processing; Siamese style convolutional
                 neural networks; similarity measures; sound search;
                 Speech processing; spoken language recognition; Task
                 analysis; TL-IMINET; transfer learning; unified
                 end-to-end training framework; vocal imitation; Vocal
                 imitation",

  author =       "F. Feng and M. Kowalski",
  title =        "Underdetermined Reverberant Blind Source Separation:
                 Sparse Approaches for Multiplicative and Convolutive
                 Narrowband Approximation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "442--456",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Approximation algorithms; approximation theory; blind
                 source separation; Blind source separation; convergence
                 of numerical methods; convergence proof; convolution;
                 convolutive narrowband approximation; Covariance
                 matrices; expectation-maximisation algorithm; Fourier
                 transforms; live recorded mixtures; Manganese;
                 multiplicative narrowband approximation; Narrowband;
                 optimisation; Optimization; optimization framework;
                 optimization problems; reverberant mixtures;
                 reverberation; room impulse response; separation
                 problem; short-time-Fourier-transform; signal
                 representation; sparse component analysis; sparse
                 source signal representation; synthesized recorded
                 mixtures; Time-frequency analysis; time-frequency
                 domain; underdetermined convolutive mixtures;
                 underdetermined reverberant blind source separation",

  author =       "Z. Wang and D. Wang",
  title =        "Combining Spectral and Spatial Features for Deep
                 Learning Based Blind Speaker Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "457--468",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; array signal processing;
                 Array signal processing; beamforming; blind source
                 separation; blind speaker separation; chimera++
                 networks; complementary spectral features; deep
                 clustering; deep learning; direction estimation;
                 enhancement network; estimated direction; Geometry;
                 individual speakers; input feature level; learning
                 (artificial intelligence); Microphone arrays;
                 microphone geometry; microphones; multichannel speaker
                 separation; objective function level; permutation
                 invariant training; reverberant environments;
                 reverberant speaker mixtures; reverberant
                 talker-independent speaker separation; reverberation;
                 source separation; Spatial features; spatial features;
                 speaker recognition; specific spectral structures;
                 Speech processing; strong separation performance; T-F
                 unit level speaker dominance; trained models; Training;
                 two-channel chimera",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "C3--C3",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "C1--469",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "C2--C2",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of {Contents[Edics]}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "470--471",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "M. Z. Jahromi and A. Zahedi and J. Jensen and J.
                 {\O}stergaard",
  title =        "Information Loss in the Human Auditory System",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "472--481",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic stimuli; Acoustics; auditory cortex; Auditory
                 system; Brain modeling; closed-vocabulary
                 intelligibility test; decoding; Gaussian mixture model;
                 Gaussian processes; hearing; Human auditory system;
                 human listener; human word recognition rate;
                 information loss; information theoretic tools; machine
                 classifier; maximum likelihood classifier; mutual
                 information; Noise measurement; optimal classifiers;
                 Oral communication; pattern classification; Signal to
                 noise ratio; signal to noise ratio; SNR; speech
                 communication model; speech processing; Speech
                 recognition; speech recognition;
                 speech-in-stationary-noise setup; vocabulary",

  author =       "Y. Buchris and A. Amar and J. Benesty and I. Cohen",
  title =        "Incoherent Synthesis of Sparse Arrays for
                 Frequency-Invariant Beamforming",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "482--495",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "array signal processing; Array signal processing;
                 audio acoustics; Bandwidth; beamformer coefficients;
                 Broadband communication; coherent sparse approach;
                 differential microphone arrays; dimensionality
                 clustering; dimensionality reduction; directivity
                 factor; frequency bin; Frequency-invariant beamformer;
                 frequency-invariant beamformers; frequency-invariant
                 beamforming; incoherent approach; incoherent sparse
                 design; incoherent synthesis; microphone arrays;
                 optimal sensors; Optimization; planar superdirective
                 array designs; Robustness; Sensor arrays; sensors
                 positions; signal waveform distortions; sparse array
                 layout; sparse arrays; sparse design; sparse designs;
                 sparse linear array designs; sparse set; superdirective
                 beamformers; underwater acoustics; uniform array
                 design; uniform arrays; white noise; white noise gain",

  author =       "Y. Rahulamathavan and K. R. Sutharsini and I. G. Ray
                 and R. Lu and M. Rajarajan",
  title =        "Privacy-Preserving {$i$Vector}-Based Speaker
                 Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "496--506",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "authentication; Bioinformatics; Cryptography; Data
                 privacy; data privacy; Feature extraction; iVector;
                 iVector-based voice verification technique; linear
                 discriminant analysis; linear discriminant analysis
                 techniques; Privacy; privacy-preserving iVector-based
                 speaker verification; privacy-preserving voice
                 verification; random domain; randomized domain;
                 security; Servers; speaker recognition; speech; voice
                 verification",

  author =       "J. Zhang and Y. Zhao and H. Li and C. Zong",
  title =        "Attention With Sparsity Regularization for Neural
                 Machine Translation and Summarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "507--518",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "abstractive summarization; attention mechanism;
                 attention weight distribution; de facto standard
                 component; Decoding; Entropy; entropy; final attention
                 distribution; input sentence; language translation;
                 Linear programming; machine translation; minimum
                 entropy regularization; neural machine translation;
                 neural nets; neural sequence; output sequence; relevant
                 input words; sequence tasks; Sequence to sequence
                 learning; sparse attention model; sparsity
                 regularization; sparsity regularization term; Speech
                 processing; Standards; summarization; Task analysis;
                 Training; visual perception",

  author =       "A. H. Moore and W. Xue and P. A. Naylor and M.
                 Brookes",
  title =        "Noise Covariance Matrix Estimation for Rotating
                 Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "519--530",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Acoustic noise; adaptive estimation; array manifold;
                 array orientation; array rotation; array signal
                 processing; beamformers; covariance matrices;
                 Covariance matrices; Covariance matrix estimation;
                 desired source activity; estimated covariance matrix;
                 Estimation; estimation theory; ground truth noise
                 covariance matrix; Harmonic analysis; head-mounted
                 arrays; Indexes; microphone array; Microphone arrays;
                 microphone arrays; microphone signal covariance;
                 microphones; minimum variance distortionless response
                 beamformer; moving microphone array; noise covariance
                 matrix estimation; noise dereverberation; noise field;
                 noise figure 0.05 dB; noise figure 18.0 dB; noise
                 reduction performance; noise suppression; noise-only
                 segments; parametric model; spatial filtering; spatial
                 filters; spherical harmonic analysis; stored model",

  author =       "G. Yang and H. He and Q. Chen",
  title =        "Emotion-Semantic-Enhanced Neural Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "531--543",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Computational modeling; convolution neural network;
                 convolutional neural nets; deep learning; ECNN;
                 emoticons; emoticons projections; emotion recognition;
                 emotion-semantic-enhanced convolutional neural network
                 model; emotional signals; emotional space projection
                 operator; Feature extraction; feature representation
                 matrix; learning (artificial intelligence); matrix
                 algebra; microblog sentimental analysis; Natural
                 language processing; natural language processing tasks;
                 pattern classification; Semantics; Sentiment analysis;
                 sentiment analysis; social networking (online); Task
                 analysis",

  author =       "T. Dietzen and A. Spriet and W. Tirry and S. Doclo and
                 M. Moonen and T. {van Waterschoot}",
  title =        "Comparative Analysis of Generalized Sidelobe
                 Cancellation and Multi-Channel Linear Prediction for
                 Speech Dereverberation and Noise Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "544--558",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "array signal processing; Array signal processing;
                 blind speech dereverberation; comparative analysis;
                 data-dependent beamforming; deconvolution; Delays;
                 dereverberation; early reverberant-speech component;
                 Fourier transforms; generalized sidelobe canceler
                 framework; generalized sidelobe cancellation; GSC
                 blocking matrix; GSC framework; incoherent-noise
                 components; MCLP framework; microphones; Microphones;
                 Multi-channel linear prediction; multichannel linear
                 prediction framework; noise reduction; Noise reduction;
                 noise reduction; reverberation; speech enhancement;
                 Speech processing; time domain simulation results;
                 Time-domain analysis",

  author =       "J. Gao and J. Du and E. Chen",
  title =        "Mixed-Bandwidth Cross-Channel Speech Recognition via
                 Joint Optimization of {DNN}-Based Bandwidth Expansion
                 and Acoustic Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "559--571",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic features; acoustic modeling; Acoustics;
                 automatic speech recognition systems; average relative
                 word error rate reduction; bandwidth expansion;
                 bandwidth expansion networks; bandwidth-dependent
                 models; conventional multiple acoustic models; Data
                 models; Deep neural network; deep neural network-based
                 bandwidth expansion; different recording channels;
                 direct mapping DNN; diversified cross-channel speech
                 data; diversified speech data; diversified training
                 data; DNN-based acoustic models; DNN-based bandwidth
                 expansion; DNN-DM; feature extraction; general
                 framework; Hidden Markov models; highest sampling rate;
                 intermediate target layers; joint optimization; joint
                 training strategies; large-scale Mandarin speech
                 datasets; learning (artificial intelligence); low
                 sampling rates; mixed-bandwidth cross-channel speech
                 recognition; mixed-bandwidth speech recognition;
                 multiple bandwidths; multitask training; Narrowband;
                 neural nets; novel DNN architectures; progressive
                 mapping; progressive stacking network; scene related
                 speech data; specific sampling rate; Speech
                 recognition; speech recognition; transmission channels;
                 unified model; Wideband",

  author =       "S. Deena and M. Hasan and M. Doulaty and O. Saz and T.
                 Hain",
  title =        "Recurrent Neural Network Language Model Adaptation for
                 Multi-Genre Broadcast Speech Recognition and
                 Alignment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "572--582",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Adaptation models; automatic speech recognition;
                 Context modeling; Data models; feature-based adaptation
                 layer; feature-based RNNLMs; hybrid adaptation
                 techniques; language model adaptation; linear hidden
                 network adaptation layer; multi-domain ASR; multigenre
                 broadcast speech recognition; n-gram language models;
                 recurrent neural nets; recurrent neural network
                 language model adaptation; recurrent neural network
                 language models; RNNLM; RNNLM adaptation techniques;
                 Speech processing; Speech recognition; speech
                 recognition; Speech recognition; Task analysis;

  author =       "F. B. Gelderblom and T. V. Tronstad and E. M. Viggen",
  title =        "Subjective Evaluation of a Noise-Reduced Training
                 Target for Deep Neural Network-Based Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "583--594",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "artificial neural networks; deep neural network;
                 Degradation; neural nets; Neural networks; Noise
                 measurement; noise-reduced training target; noisy
                 speech; POLQA; Signal to noise ratio; speech
                 distortion; Speech enhancement; speech enhancement;
                 speech enhancement systems; speech intelligibility;
                 speech processing; speech quality; speech recognition;
                 speech recognition test; subjective evaluation;

  author =       "M. Luis Valero and E. A. P. Habets",
  title =        "Low-Complexity Multi-Microphone Acoustic Echo Control
                 in the Short-Time {Fourier} Transform Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "595--609",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic coupling; acoustic signal processing;
                 Acoustics; array signal processing; background noise;
                 Convergence; desired near-end speech; echo suppression;
                 echo-to-noise ratio; Estimation; far-end signal;
                 Fourier transforms; high-quality end-to-end
                 communication; loudspeaker; loudspeakers;
                 low-complexity MM-AEC; low-complexity multimicrophone
                 echo controller; microphones; Microphones; modern
                 communication; Multi-microphone acoustic echo control;
                 multi-microphone noise reduction; multimicrophone
                 acoustic echo cancellation techniques; multimicrophone
                 acoustic echo control; multimicrophone speech; near-end
                 room; Noise measurement; relative transfer function
                 estimation; residual echo reduction; short-time Fourier
                 transform; smart devices; speech enhancement; Speech
                 processing; speech processing; Steady-state",

  author =       "Q. Zhu and P. Coleman and X. Qiu and M. Wu and J. Yang
                 and I. Burnett",
  title =        "Robust Personal Audio Geometry Optimization in the
                 {SVD}-Based Modal Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "610--620",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic contrast control; acoustic signal processing;
                 Acoustics; audio signal processing; broadband
                 equalization; equalisers; Geometry; geometry
                 optimization method; interference; listening zone;
                 Loudspeakers; loudspeakers; natural sound reproduction;
                 optimisation; Optimization; personal audio geometry
                 optimization; personalized listening experiences;
                 planarity control; pressure matching; private listening
                 experiences; quiet zone; regularization; Robustness;
                 robustness; shared space sound zones; singular value
                 decomposition; sound reproduction; sound reproduction
                 perturbations; sound zones; Spatial audio; SVD-based
                 modal domain; system geometry; Transfer functions;

  author =       "J. Yi and J. Tao and Z. Wen and Y. Bai",
  title =        "Language-Adversarial Transfer Learning for
                 Low-Resource Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "621--630",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic model; Acoustics; Adaptation models;
                 adversarial learning; adversarial SHL-model;
                 Adversarial training; cross-lingual; Knowledge
                 transfer; language invariant features;
                 language-adversarial transfer learning; learning
                 (artificial intelligence); Learning systems; low
                 resource conditions; low-resource; Neural networks;
                 shared features; shared hidden layer model; speech
                 recognition; Speech recognition; speech recognition;
                 target language; target model; Training; transfer
                 learning; unnecessary language dependent information",

  author =       "J. Zhang and Z. Ling and L. Liu and Y. Jiang and L.
                 Dai",
  title =        "Sequence-to-Sequence Acoustic Modeling for Voice
                 Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "631--644",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic features; acoustic models; Acoustics;
                 appropriate duration conversion; attention; automatic
                 speech recognition model; Cloning; conversion stage;
                 Decoding; deep neural networks; Feature extraction;
                 feature extraction; feature sequences; Gaussian mixture
                 models; Gaussian processes; Linguistics; Mel-scale
                 spectrograms; Mel-spectrogram; Mel-spectrograms; neural
                 nets; SCENT model; sequence-to-sequence;
                 sequence-to-sequence acoustic modeling;
                 sequence-to-sequence ConvErsion NeTwork; source speech;
                 source utterances; Speech processing; speech
                 recognition; speech signals; target speakers; training
                 stage; unified acoustic model; vocal tract
                 descriptions; Vocoders; vocoders; Voice conversion;
                 Voice Conversion Challenge 2018",

  author =       "X. Li and L. Girin and S. Gannot and R. Horaud",
  title =        "Multichannel Speech Separation and Enhancement Using
                 the Convolutive Transfer Function",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "645--659",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "1-norm minimization; 2-norm fitting cost;
                 approximation theory; array signal processing; Audio
                 source separation; basis pursuit method;
                 beamforming-like multichannel inverse filtering method;
                 computational cost; Convolution; convolutive transfer
                 function; convolutive transfer function approximation;
                 CTF domain; filter perturbations; filtering theory;
                 Fourier transforms; Lasso optimization; microphone
                 signals; microphones; Microphones; minimisation; MINT;
                 mixing filters; mixing model; multichannel convolutive
                 mixtures; multichannel speech enhancement; multichannel
                 speech separation; multiple input-output inverse
                 theorem; noise power level; noisy mixtures; power
                 minimization; reverberation; short-time Fourier
                 transform; short-time Fourier transform domain;
                 single-source MINT; Source separation; source
                 separation; spectral sparsity; speech enhancement;
                 Speech enhancement; Time-domain analysis; time-domain
                 filters; time-domain inverse filters; time-domain
                 Lasso; transfer functions; Transfer functions",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "C3--C3",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "C1--660",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "C2--C2",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of {Contents[Edics]}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "661--662",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Z. Zhao and H. Liu and T. Fingscheidt",
  title =        "Convolutional Neural Networks to Enhance Coded
                 Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "663--678",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "adaptive codes; adaptive multirate wideband codec;
                 category rating listening testing; cepstral analysis;
                 Cepstral analysis; cepstral domain feature approach;
                 CMOS integrated circuits; CMOS points; coded speech
                 enhancement; convolutional codes; convolutional neural
                 nets; convolutional neural networks; Convolutional
                 neural networks; far-end acoustic background noise;
                 G.711-coded speech; ITU-T-standardized postfilter;
                 narrowband speech codecs; Noise measurement;
                 postprocessing approaches; Quantization (signal);
                 quantization noise; Signal to noise ratio; speech
                 codecs; speech coding; Speech coding; Speech
                 enhancement; speech enhancement; speech quality
                 evaluation; statistical analysis; statistical
                 significance; time domain approaches; time-domain
                 analysis; time-domain approach; transmission errors;
                 uncoded speech; wideband speech codecs",

  author =       "H. Schepker and S. E. Nordholm and L. T. T. Tran and
                 S. Doclo",
  title =        "Null-Steering Beamformer-Based Feedback Cancellation
                 for Multi-Microphone Hearing Aids With Incoming Signal
                 Preservation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "679--691",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic feedback; Acoustic feedback cancellation;
                 acoustic feedback paths; acoustic signal processing;
                 Acoustics; adaptive filter; adaptive filters; array
                 signal processing; biased optimal solution; closed-loop
                 acoustical system; fixed beamformer; hearing aid
                 loudspeaker; Hearing aids; hearing aids; incoming
                 signal directions; incoming signal preservation; least
                 squares approximations; least-squares optimization;
                 least-squares optimization procedure; Loudspeakers;
                 loudspeakers; microphones; Microphones; min-max
                 optimization; min-max optimization procedure; minimax
                 techniques; multimicrophone hearing aids; multiple
                 integrated microphones; null-steering; null-steering
                 beamformer-based feedback cancellation; Optimization;
                 perfect feedback cancellation; residual feedback power;
                 Speech processing; transfer functions; Transfer
                 functions",

  author =       "Z. Li and Y. Song and L. Dai and I. McLoughlin",
  title =        "Listening and Grouping: an Online Autoregressive
                 Approach for Monaural Speech Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "692--703",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "autoregressive processes; causal temporal context;
                 closed-set evaluation; computational auditory scene
                 analysis; deep learning; Deep learning; deep learning
                 power; Extraterrestrial measurements; frame levels;
                 grouping architecture; grouping stage; Image analysis;
                 label permutation problem; learned listening; learning
                 (artificial intelligence); multispeaker monaural speech
                 separation; Neural networks; online autoregressive
                 approach; open-set evaluation; segment levels;
                 signal-to-distortion ratio; Speech processing; speech
                 quality scores; speech recognition; Speech separation;
                 Task analysis; Training; WSJ0-2mix benchmark",

  author =       "D. Deng and L. Jing and J. Yu and S. Sun and M. K.
                 Ng",
  title =        "Sentiment Lexicon Construction With Hierarchical
                 Supervision Topic Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "704--718",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "data mining; hierarchical supervision information;
                 hierarchical supervision topic model; Modeling; Motion
                 pictures; multinomial distribution; Neural networks;
                 opinion mining; pattern classification; Probabilistic
                 logic; probability; Sentiment analysis; sentiment
                 analysis; Sentiment analysis; sentiment analysis;
                 sentiment classification; sentiment lexicon
                 construction; Speech processing; Sun; text mining;
                 topic model; topic-adaptive sentiment lexicon",

  author =       "M. Zhou and M. Huang and X. Zhu",
  title =        "Story Ending Selection by Finding Hints From Pairwise
                 Candidate Endings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "719--729",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "commonsense reasoning; Computational modeling; Context
                 modeling; ending vector prediction; evidence bias
                 issue; four-sentence story context; humanities; Machine
                 reading comprehension; machine reading comprehension;
                 natural language processing; Natural languages; neural
                 nets; neural networks; pairwise candidate endings;
                 Predictive models; query processing; Semantics; Speech
                 processing; Story Cloze Test; story comprehension;
                 story ending selection; Task analysis; vectors",

  author =       "J. Richter and J. Fels",
  title =        "On the Influence of Continuous Subject Rotation During
                 High-Resolution Head-Related Transfer Function
                 Measurements",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "730--741",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Acoustic measurements; acoustic signal processing;
                 artificial head; audible influence; audio signal
                 processing; continuous measurement rotation; continuous
                 rotation; continuous subject rotation; HRTF
                 measurement; individual head-related transfer function;
                 Interpolation; interpolation; loudspeaker arrays;
                 loudspeakers; Loudspeakers; loudspeakers; measurement
                 signals; microphone arrays; objective comparison;
                 Position measurement; position measurement; Rotation
                 measurement; rotation measurement; rotation speed;
                 rotation speeds; Signal resolution; signal resolution;
                 sine sweep measurements; step-wise measurement
                 rotation; step-wise subject positioning; subjective
                 comparison; subjective listening experiment; Time
                 measurement; time measurement; transfer functions",

  author =       "J. Yu and K. Markov and T. Matsui",
  title =        "Articulatory and Spectrum Information Fusion Based on
                 Deep Recurrent Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "742--752",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic features; acoustic model DNN;
                 acoustic-to-articulatory inversion; Acoustics; AM DNN
                 training; articulatory features; articulatory
                 information; articulatory inversion DNN; Automatic
                 speech recognition; automatic speech recognition
                 systems; Computational modeling; Data models; deep
                 neural networks-hidden Markov model hybrid; deep
                 recurrent neural networks; distillation training; DNN
                 acoustic model; feature-based approach; feature-based
                 method; Hidden Markov models; hidden Markov models;
                 model-based approach; model-based method; phoneme
                 recognition system; recognition time; recurrent neural
                 nets; speech processing; Speech processing; Speech
                 recognition; speech recognition; Training; underlying
                 acoustic model",

  author =       "F. P. Itturriet and M. H. Costa",
  title =        "Perceptually Relevant Preservation of Interaural Time
                 Differences in Binaural Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "753--764",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic noise; acoustic signal processing; aid
                 designers; binaural; binaural hearing aids; Cost
                 function; developed MWF-ITD technique; diffuse noise
                 fields; directional acoustic noise source; directional
                 noise source; Ear; Hearing aids; hearing aids;
                 Integrated circuits; interaural coherence concept;
                 interaural phase difference; interaural time
                 difference; ITD binaural cues; ITD subjective
                 perception; microphones; Microphones; multichannel
                 Wiener filter; MWF-IC technique; noise reduction; noise
                 reduction method; noise reduction technique; original
                 IC magnitude; processed noise; residual noise spatial
                 preservation; signal denoising; spatial subjective
                 sensation; speech processing; Wiener filter; Wiener
                 filters",

  author =       "J. Abel and T. Fingscheidt",
  title =        "Sinusoidal-Based Lowband Synthesis for Artificial
                 Speech Bandwidth Extension",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "765--776",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic bandwidth; artificial speech bandwidth
                 extension; Artificial speech bandwidth extension; CMOS
                 points; conventional narrowband telephony; Estimation;
                 Frequency estimation; Harmonic analysis; Hidden Markov
                 models; high-frequency components; instrumental quality
                 assessment; low-frequency band; lowband; NB speech;
                 sinusoidal; spectral analysis; spectrally balanced
                 speech signals; Speech coding; speech coding; speech
                 enhancement; Speech enhancement; speech
                 intelligibility; speech processing; speech quality;
                 speech synthesis",

  author =       "Q. Kong and Y. Xu and I. Sobieraj and W. Wang and M.
                 D. Plumbley",
  title =        "Sound Event Detection and Time Frequency Segmentation
                 from Weakly Labelled Data",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "777--787",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal detection; acoustic signal processing;
                 audio signal processing; classification mapping;
                 convolutional neural network; Convolutional neural
                 networks; DCASE 2018 Task 2 sound events data; Event
                 detection; feature extraction; learning (artificial
                 intelligence); neural nets; probability; segmentation
                 mapping; Sound event detection; sound event detection;
                 Spectrogram; speech recognition; supervised SED
                 algorithms; T-F segmentation masks; Tagging; Task
                 analysis; Time-frequency analysis; time-frequency
                 segmentation; Training; weakly labelled data",

  author =       "Y. Tuan and H. Lee",
  title =        "Improving Conditional Sequence Generative Adversarial
                 Networks by Stepwise Evaluation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "788--798",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "chit-chat dialogue generation; computational costs;
                 conditional sequence generation tasks; conditional
                 sequence generative adversarial networks; Decoding;
                 Gallium nitride; Generative adversarial network;
                 Generative adversarial networks; Generators;
                 interactive systems; Maximum likelihood estimation;
                 MCTS; Monte Carlo methods; Monte Carlo tree search;
                 neural nets; REGS; SeqGAN; sequence generation;
                 StepGAN; stepwise evaluation; stepwise GAN; Task
                 analysis; Training; tree searching",

  author =       "N. Dionelis and M. Brookes",
  title =        "Modulation-Domain {Kalman} Filtering for Monaural
                 Blind Speech Denoising and Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "799--814",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "adaptive algorithm; adaptive filters; blind joint
                 denoising; dereverberation; direct-to-reverberant
                 energy ratio; DRR; interframe speech dynamics; Kalman
                 filter update step models; Kalman filtering; Kalman
                 filters; log-magnitude spectrum; minimum mean-square
                 error (MMSE) estimation; modulation; modulation-domain
                 Kalman filtering; monaural blind speech denoising;
                 monaural blind speech dereverberation; monaural speech
                 enhancement algorithm; Noise measurement; Noise
                 reduction; noisy reverberant speech; posterior
                 distribution estimation; reverberant speech to noise
                 ratios; reverberation; Reverberation; reverberation
                 time T60 parameters; signal denoising; Speech
                 enhancement; speech enhancement; Speech enhancement;
                 speech intelligibility; speech intelligibility quality;
                 speech log-magnitude spectrum estimation;
                 Time-frequency analysis; time-frequency log-magnitude
                 spectra",

  author =       "R. Lotfian and C. Busso",
  title =        "Curriculum Learning for Speech Emotion Recognition
                 From Crowdsourced Labels",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "815--826",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "classification task; Computers; crowdsourced labels;
                 curriculum learning; Curriculum learning; deep neural
                 networks; DNNs; emotion perception; emotion
                 recognition; Emotion recognition; emotional content;
                 human judgments; inter-evaluator agreement; learning
                 (artificial intelligence); Machine learning; machine
                 learning problems; multiclass classification; neural
                 nets; pattern classification; regression analysis;
                 regression problems; speech emotion recognition; Speech
                 processing; Speech recognition; speech recognition;
                 speech samples; Task analysis; Training",

  author =       "S. Lin",
  title =        "Robust Pitch Estimation and Tracking For Speakers
                 Based on Subband Encoding and The Generalized Labeled
                 Multi-{Bernoulli} Filter",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "827--841",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "additive noise; auditory filterbank; autocorrelation;
                 CASA; channel bank filters; computational auditory
                 scene analysis approach; correlation methods;
                 Estimation; estimation theory; frequency coverage;
                 frequency coverage metric; Frequency estimation;
                 generalized labeled multiBernoulli filter; GLMB
                 tracking filter; Harmonic analysis; Hidden Markov
                 models; measurement driven birth; measurement-driven
                 birth model; normalized autocorrelation calculation;
                 Ornstein Uhlenbeck process; Ornstein-Uhlenbeck process;
                 pitch state transition model; Pitch tracking; robust
                 pitch estimation methods; robust pitch tracker; sound
                 signal decomposition; speaker estimation; speaker
                 recognition; speaker tracking; speech coding; Speech
                 processing; spurious error suppression; subband
                 encoding; subband signals; Target tracking; temporal
                 continuity constraint; time-frequency analysis;
                 Time-frequency analysis; time-frequency sparsity",

  author =       "X. Wang and I. Cohen and J. Chen and J. Benesty",
  title =        "On Robust and High Directive Beamforming With
                 Small-Spacing Microphone Arrays for Scattered Sources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "842--852",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic radiators; acoustic wave scattering;
                 Acoustics; Array signal processing; array signal
                 processing; broadband acoustic source processing;
                 diffuse noise gain; diffuse noise suppression;
                 directional noise suppression; frequency-invariant
                 beamformer; generalized MDNG beamformer; joint
                 diagonalization technique; low white noise gain;
                 maximum diffuse noise gain beamformer; maximum WNG
                 beamformer; Microphone array; microphone arrays;
                 Microphone arrays; MWNG beamformer; robust high
                 directive beamforming; scattered acoustic source
                 processing; scattered source; Sensor arrays;
                 small-spacing microphone arrays; White noise; white
                 noise; white noise gain",

  author =       "Z. Quan and Z. Wang and Y. Le and B. Yao and K. Li and
                 J. Yin",
  title =        "An Efficient Framework for Sentence Similarity
                 Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "853--865",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "attention constituency vector tree; attention weight;
                 attention weight mechanisms; Kernel; Natural language
                 processing; natural language processing; natural
                 language processing applications; neural network
                 methods; Neural networks; semantic information;
                 semantic textual similarity datasets; Semantics;
                 sentence embedding; Sentence similarity; sentence
                 similarity measure; sentence similarity modeling;
                 Speech processing; structured trees; syntactic
                 information; syntactic structure; Syntactics; text
                 analysis; tree kernel; trees (mathematics); Vegetation;
                 word embedding; word embedding techniques",

  author =       "N. Lubis and S. Sakti and K. Yoshino and S. Nakamura",
  title =        "Positive Emotion Elicitation in Chat-Based Dialogue
                 Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "866--877",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Affective computing; affective computing; affective
                 dialogue systems; Appraisal; chat-based dialogue
                 system; chat-based dialogue systems; Crowdsourcing;
                 Databases; dialogue corpus; dialogue system
                 interaction; elicit positive emotion; emotion
                 appraisal; emotion elicitation; emotion recognition;
                 Emotion recognition; emotion-rich corpora;
                 emotion-sensitive neural chat-based dialogue system;
                 emotional benefit; emotional support; human computer
                 interaction; information retrieval; interactive
                 systems; Natural language processing; natural language
                 processing; neural nets; Neural networks; neural
                 networks; positive emotion elicitation corpus; positive
                 emotional response; positive emotional states; positive
                 emotional valence; Speech processing",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "C3--C3",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "C1--878",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "C2--C2",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "879--880",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "F. J. Ibarrola and R. D. Spies and L. E. {Di Persia}",
  title =        "Switching Divergences for Spectral Learning in Blind
                 Speech Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "881--891",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "artificial reverberation; Atomic measurements; audio
                 quality; audio signal processing; blind speech
                 dereverberation; Cost function; cost function
                 minimization; dereverberation; Dictionaries; dictionary
                 learning; enclosed room; fidelity term; Frequency
                 measurement; generalized $ \beta $-divergence; human computer
                 interaction; human-machine interaction technologies;
                 learning (artificial intelligence); nonnegative
                 representation; observed spectrogram; optimal fidelity
                 parameter; penalization; real recordings;
                 reverberation; Reverberation; reverberation model;
                 Signal processing; signal representation; sound signal;
                 spectral learning; spectral structure; Spectrogram;
                 speech processing; Speech processing; two-stage
                 dereverberation approach",

  author =       "I. Cohen and J. Benesty and J. Chen",
  title =        "Differential {Kronecker} Product Beamforming",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "892--902",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Acoustic arrays; Acoustics; array signal processing;
                 Array signal processing; beampattern; Covariance
                 matrices; Differential beamforming; differential
                 Kronecker product beamformers; differential Kronecker
                 product beamforming; directivity factor; front-to-back
                 ratio; Kronecker product; Kronecker product
                 decomposition; Kronecker product formulation;
                 microphone array; microphone arrays; Microphone arrays;
                 steering vector; superdirective beamforming; tradeoff
                 control; vectors; virtual arrays; white noise; White
                 noise; white noise gain",

  author =       "C. Elisei-Iliescu and C. Paleologu and J. Benesty and
                 C. Stanciu and C. Anghel and S. Ciochin{\u{a}}",
  title =        "Recursive Least-Squares Algorithms for the
                 Identification of Low-Rank Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "903--918",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Adaptive filter; adaptive filters; Adaptive systems;
                 Approximation algorithms; Complexity theory;
                 computationally efficient versions; Convergence;
                 convergence/tracking capabilities; DCD iterations;
                 dichotomous coordinate descent iterations; echo
                 cancellation; Echo cancellers; echo suppression; fast
                 convergence rate; FIR filters; gradient methods;
                 high-dimension system identification problem; impulse
                 response decomposition; iterative methods; least mean
                 squares methods; least squares approximations; long
                 length adaptive filters; long length impulse responses;
                 low-dimension problems; low-rank approximation;
                 low-rank systems identification; Matrix decomposition;
                 nearest Kronecker product; QR decomposition techniques;
                 recursive least-squares (RLS) algorithm; recursive
                 least-squares algorithms; regularization; RLS
                 algorithm; Speech processing; system identification;
                 system identification problems; Wiener filter; Wiener
                 filters",

  author =       "A. Kumar and T. Guha and P. K. Ghosh",
  title =        "{Dirichlet} Latent Variable Model: a Dynamic Model
                 Based on {Dirichlet} Prior for Audio Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "919--931",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "audio processing applications; audio signal
                 processing; Data models; Dirichlet distribution;
                 Dirichlet latent variable model; dynamic Dirichlet;
                 dynamic latent variable model; dynamic parameters;
                 expectation-maximisation algorithm; exponential family
                 distributions; Hidden Markov models; Latent variable
                 model; learning (artificial intelligence); NMF; NMF
                 dynamic version; non negative; nonnegative matrix
                 factorization; probabilistic latent component analysis;
                 Probabilistic logic; Signal processing algorithms;
                 source separation; Source separation; speaker source
                 separation; Speech processing; time varying",

  author =       "P. Jancovic and M. K{\"o}k{\"u}er",
  title =        "Bird Species Recognition Using Unsupervised Modeling
                 of Individual Vocalization Elements",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "932--947",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic modeling; acoustic models; acoustic scene;
                 acoustic signal detection; acoustic signal processing;
                 Acoustics; audio field recordings; audio recording;
                 audio signal processing; bioacoustics; biology
                 computing; bird species identification; bird species
                 recognition; Bird species recognition; bird
                 vocalization elements; Birds; DNN-HMM; element models;
                 Feature extraction; field recording; hidden Markov
                 model; hidden Markov models; Hidden Markov models;
                 hybrid deep neural network-hidden Markov model;
                 iterative maximum likelihood label re-assignment
                 procedure; maximum likelihood estimation; multiple bird
                 species; neural nets; Noise measurement; nonbird sound
                 recordings; normalized magnitude values;
                 postrecognition stage; recognition accuracy;
                 segmentation; signal classification; sinusoid; sound
                 field recordings; Speech processing; Speech
                 recognition; speech recognition; state duration
                 modeling; unsupervised; unsupervised modeling;
                 vocalisation element",

  author =       "T. Koriyama and T. Kobayashi",
  title =        "Statistical Parametric Speech Synthesis Using Deep
                 {Gaussian} Processes",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "948--959",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "approximation method; approximation theory; Bayes
                 methods; Bayesian model; contextual features;
                 conventional framework; deep architecture model; deep
                 Gaussian processes; deep neural network-based speech
                 synthesis; DGP framework; doubly stochastic variational
                 inference; feedforward DNN-based method; Gaussian
                 process; Gaussian processes; Global Positioning System;
                 Hidden Markov models; Kernel; learning (artificial
                 intelligence); model complexity; neural nets; Neural
                 networks; regression analysis; speech parameters;
                 Speech synthesis; speech synthesis; stacked Bayesian
                 kernel regressions; Statistical parametric speech
                 synthesis; statistical parametric speech synthesis
                 framework; stochastic variational inference; Training
                 data",

  author =       "K. Shimada and Y. Bando and M. Mimura and K. Itoyama
                 and K. Yoshii and T. Kawahara",
  title =        "Unsupervised Speech Enhancement Based on Multichannel
                 {NMF}-Informed Beamforming for Noise-Robust Automatic
                 Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "960--971",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "array signal processing; Array signal processing;
                 audio signal processing; beamforming; Covariance
                 matrices; covariance matrices; Estimation; full-rank
                 multichannel Wiener filters; minimum variance
                 distortionless response beamforming; multichannel
                 NMF-informed beamforming; multichannel nonnegative
                 matrix factorization; multichannel speech enhancement;
                 MVDR beamformers; neural nets; noise components; Noise
                 measurement; noise-robust automatic speech recognition;
                 noisy environments; Noisy speech recognition; observed
                 noisy mixtures; rank-1 multichannel Wiener filters;
                 separated speech; source separation; spatial
                 information; Spectrogram; speech enhancement; Speech
                 enhancement; speech recognition; time-frequency bin;
                 unknown noisy environment; unsupervised approach;
                 unsupervised speech enhancement; Wiener filters",

  author =       "S. Widmark",
  title =        "Causal {MSE}-Optimal Filters for Personal Audio
                 Subject to Constrained Contrast",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "972--987",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic contrast; acoustic signal processing;
                 Acoustics; audio signal processing; bright zone
                 behavior; causal MSE-optimal filters; constrained
                 contrast; Design methodology; direct method; filtering
                 theory; filters; Frequency control; frequency-domain
                 analysis; Frequency-domain analysis; frequency-domain
                 optimal method; IIR filters; Mathematical model; novel
                 design method; optimisation; Optimization; personal
                 audio subject; pre-compensation filters; pre-existing
                 noncausal methods; Signal processing; sound-system-room
                 interactions; spectral bright zone behavior; Speech
                 processing; unattainable contrasts",

  author =       "Anonymous",
  title =        "Article Awards for the {{\booktitle{IEEE\slash ACM
                 Transactions on Audio, Speech, and Language
                 Processing}}}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "988--988",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Awards",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "C3--C3",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "C1--989",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "C2--C2",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "Table of contents {(EDICS)}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "990--991",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "A. Mesaros and A. Diment and B. Elizalde and T.
                 Heittola and E. Vincent and B. Raj and T. Virtanen",
  title =        "Sound Event Detection in the {DCASE 2017} Challenge",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "992--1006",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal detection; acoustic signal processing;
                 Acoustics; confidence interval calculation; confidence
                 intervals; DCASE 2017 challenge; deep neural networks;
                 Detection and Classification of Acoustic Scenes and
                 Events; detection requirements; Event detection; Glass;
                 Hidden Markov models; jackknife estimates; jackknife
                 resampling procedure; learning (artificial
                 intelligence); maximization-minimization; mel
                 frequency-based representations; neural nets;
                 overlapping events; pattern recognition; ranking
                 metric; signal classification; signal representation;
                 Sound event detection; sound event detection; Speech
                 processing; statistical analysis; target sound events;
                 Task analysis; task-specific optimization; testing
                 data; Training; training data; weak labels; weakly
                 labeled data",

  author =       "S. R. Chetupalli and T. V. Sreenivas",
  title =        "Late Reverberation Cancellation Using {Bayesian}
                 Estimation of Multi-Channel Linear Predictors and
                 {Student}'s $t$-Source Prior",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "1007--1018",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Bayes methods; Bayesian estimation; Bayesian learning;
                 channel estimation; delayed linear predictor;
                 Dereverberation; early reflection component; enhanced
                 signals; Estimation; expectation-maximisation
                 algorithm; Fourier transforms; gamma distributed
                 precision; gamma distribution; Gaussian distribution;
                 Gaussian source model; hyper-parameter estimation;
                 inference estimation; late reverberation cancellation;
                 late reverberation suppression; linear prediction;
                 MCLP; microphone; Microphones; MIMO communication; MIMO
                 schemes; MISO communication; MISO scheme; multichannel
                 linear predictors; multichannel output schemes;
                 prediction residual; Predictive models; real room
                 impulse responses; residual signal estimation;
                 Reverberation; reverberation; short-time Fourier
                 transform; single channel output schemes; sparse
                 coefficient vector; spatial filtering; spatial filters;
                 stochastic models; student t-distribution model;
                 student t-source prior; time-dependent precision;
                 transient response; variational Bayes expectation
                 maximization algorithm; variational inference;
                 variational techniques; VBEM algorithm",

  author =       "L. Juvela and B. Bollepalli and V. Tsiaras and P.
                 Alku",
  title =        "{GlotNet} --- a Raw Waveform Model for the Glottal
                 Excitation in Statistical Parametric Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "1019--1030",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic features; Acoustics; Computational modeling;
                 direct speech waveform model; feedforward neural nets;
                 generative neural network models; GlotNet; glottal
                 excitation waveforms; glottal pulseforms; Glottal
                 source model; glottal vocoders; Hidden Markov models;
                 human voice production mechanism; model complexity;
                 model size; Neural networks; raw audio; raw waveform
                 glottal excitation model; raw waveform model; speech
                 processing; speech synthesis; Speech synthesis; speech
                 waveforms; statistical analysis; statistical parametric
                 speech synthesis; statistical parametric TTS system;
                 statistical vocoders; straightforward deep feedforward
                 neural networks; synthesis quality; text-to-speech;
                 text-to-speech synthesis; time-domain waveforms;
                 vocoders; Vocoders; voice similarity; waveform
                 generator architecture; WaveNet; WaveNet-like

  author =       "F. Winter and F. Schultz and G. Firtha and S. Spors",
  title =        "A Geometric Model for Prediction of Spatial Aliasing
                 in {$ 2.5 $D} Sound Field Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "1031--1046",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "2.5D sound field synthesis; acoustic signal
                 processing; active prioritization; analytical sound
                 field synthesis approaches; anti-aliasing criteria;
                 approximation theory; arbitrary convex loudspeaker
                 arrays; array signal processing; artefact-free
                 synthesis; control region; conventional wave field
                 synthesis; finite ensemble; Frequency synthesizers;
                 fundamental sound fields; geometric model; geometrical
                 framework; geometry; Geometry; local sound field
                 synthesis approaches; local wave field synthesis;
                 loudspeaker array arrangements; loudspeakers;
                 Loudspeakers; Mathematical model; Numerical models;
                 numerical simulation; plane waves; predicted spatial
                 structure; Predictive models; ray-approximation; signal
                 sampling; signal synthesis; Sound field synthesis;
                 sound reproduction; spatial aliasing; spatial aliasing
                 artefacts; spatial aliasing avoidance; spatial sampling
                 process; spatial structure; Speech processing;
                 spherical waves; synthesis problem; synthesised sound
                 fields; time 2.5 d",

  author =       "Y. Liu and T. Lee and T. Law and K. Y. Lee",
  title =        "Acoustical Assessment of Voice Disorder With
                 Continuous Speech Using {ASR} Posterior Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "1047--1059",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic features; acoustical assessment; ASR
                 features; ASR posterior features; ASR-based voice
                 features; automatic speech recognition system;
                 automating voice assessment; continuous speech;
                 continuous speech utterances; conventional features;
                 conventional voice features; Databases; deep neural
                 network; disordered voice; DNN based ASR system;
                 Feature extraction; homogeneous speech samples;
                 individual utterances; low-dimension ASR-based feature
                 vector; Mel frequency cepstral coefficient; mild
                 disorder; neural nets; normal voice; Pathology; phone
                 posterior probabilities; posterior features;
                 probability; Reliability; severe disorder; Speech
                 processing; speech recognition; subject-level
                 prediction accuracy; sustained vowels; Task analysis;
                 utterance-level prediction accuracy; Voice assessment;
                 voice disorder severity",

  author =       "C. P{\"o}rschmann and J. M. Arend and F. Brinkmann",
  title =        "Directional Equalization of Sparse Head-Related
                 Transfer Function Sets for Spatial Upsampling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "1060--1071",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; directional equalization;
                 directional rigid sphere transfer function;
                 full-spherical sets; Harmonic analysis; head-related
                 transfer functions; head-related transfer functions
                 (HRTFs); interpolation; Interpolation; inverse SH
                 transform; inverse transforms; order-limitation errors;
                 set theory; SH interpolation; sparse datasets; sparse
                 HRTF set; Spatial audio; spatial complexity; Spatial
                 resolution; spatial upsampling; spectral components;
                 Speech processing; spherical harmonics; temporal
                 component; Time-domain analysis; Transfer functions;
                 transfer functions; Transforms",

  author =       "S. S. Payal and V. J. Mathews and D. J. Button and A.
                 Iyer and R. H. Lambert and J. Hutchings and L. A.
  title =        "Equalization of Nonlinear Propagation Distortion in
                 Cylindrical Waveguides",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "1072--1084",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Acoustic distortion; acoustic waveforms; Acoustic
                 waveguides; air-filled waveguide; Atmospheric modeling;
                 Burgers propagation model; circular waveguides;
                 equalisers; equalization; Equalizers; forward model;
                 harmonic distortion; high sound pressure levels;
                 intermodulation distortion; inverse problems;
                 Mathematical model; model-based method; model-based
                 pre-equalizer; Nonlinear acoustics; nonlinear
                 distortion; Nonlinear distortion; nonlinear
                 equalization; nonlinear propagation distortion;
                 nonlinear systems; propagation-induced distortion;
                 sign-inverted propagation model; total harmonic
                 distortion; wave propagation",

  author =       "B. Sisman and M. Zhang and H. Li",
  title =        "Group Sparse Representation With {WaveNet} Vocoder
                 Adaptation for Spectrum and Prosody Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "1085--1097",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "activation matrix; Continuous wavelet transforms;
                 conversion framework; Dictionaries; energy contour;
                 feature conversion module; feature conversion studies;
                 Gaussian processes; general speech corpus; general
                 speech databases; group sparse representation; group
                 sparsity mathematical formulation; matrix algebra;
                 natural language processing; objective evaluations;
                 phonetic dictionary; phonetic posteriorgrams; phonetic
                 posteriorgrams (PPGs); phonetic sparse representation;
                 Phonetics; PPG generator; prosody conversion; prosody
                 conversion techniques; prosody features; signal
                 representation; source-target training data; Sparse
                 matrices; speaker characteristic transformation;
                 speaker identity; spectral features; spectrum
                 conversion; speech coding; statistical analysis;
                 statistical approach; subjective evaluations; tandem
                 feature; target speaker data; Training data; vocoders;
                 Vocoders; vocoding quality; Voice conversion; voice
                 conversion quality; wavenet vocoder; WaveNet vocoder",

  author =       "J. Lee and H. Kang",
  title =        "A Joint Learning Algorithm for Complex-Valued {T--F}
                 Masks in Deep Learning-Based Single-Channel Speech
                 Enhancement Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "1098--1108",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "complex-valued T-F masks; complex-valued
                 time-frequency mask; complex-valued time-frequency
                 masks; Dynamic range; exact time-domain reconstruction;
                 input noisy phase component; irregular spectrogram
                 pattern; joint learning algorithm; large-scale deep
                 learning network; learning (artificial intelligence);
                 Learning systems; Linear programming; microphones;
                 Noise measurement; phase spectra; single-channel
                 microphone environment; Single-channel speech
                 enhancement; single-channel speech enhancement systems;
                 sound quality; spectrogram consistency; speech
                 enhancement; Speech enhancement; speech enhancement
                 algorithms; Time-domain analysis; time-frequency",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "C3--C3",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "7",
  pages =        "C1--1109",
  month =        jul,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "7",
  pages =        "C2--C2",
  month =        jul,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of {Contents[Edics]}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "7",
  pages =        "1110--1111",
  month =        jul,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "J. Fle{\ss}ner and T. Biberger and S. D. Ewert",
  title =        "Subjective and Objective Assessment of Monaural and
                 Binaural Aspects of Audio Quality",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "7",
  pages =        "1112--1125",
  month =        jul,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic noise; Audio quality; audio signal
                 processing; auditory model; BAM-Q; binaural audio
                 quality degradation prediction; binaural
                 auditory-model-based quality prediction; binaural
                 quality aspects; binaural signal distortions; combined
                 monaural-binaural model; Databases; distortion;
                 Distortion measurement; generalized power-spectrum
                 model; generalized power-spectrum model for quality;
                 GPSMq; joint overall audio predictions; monaural signal
                 distortions; Nonlinear distortion; objective
                 assessment; Predictive models; Psychoacoustic models;
                 Psychoacoustics; spatial audio; subjective assessment",

  author =       "B. Yusuf and B. Gundogdu and M. Saraclar",
  title =        "Low Resource Keyword Search With Synthesized
                 Crosslingual Exemplars",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "7",
  pages =        "1126--1135",
  month =        jul,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic data; Acoustics; ASR-based baseline results;
                 average term weighted value; bottleneck features; data
                 scarcity; data-scarce settings; distance metric
                 learning; dynamic time warping; EDML systems; exemplar
                 matching; extended distance metric learner; Keyword
                 search; keyword search performance; Lattices; low
                 resource keyword search; multilingual acoustic model;
                 multilingual features; multilingual network; natural
                 language processing; Neural networks; out-of-vocabulary
                 terms; query by example; query processing;
                 query-by-example task; source languages; speech
                 processing; speech recognition; Spoken term detection;
                 synthesized crosslingual exemplars; synthetic phone
                 exemplars; target language; Training; Training data;
                 training data; transfer learning; Vocabulary",

  author =       "A. I. Koutrouvelis and R. C. Hendriks and R. Heusdens
                 and J. Jensen",
  title =        "Robust Joint Estimation of Multimicrophone Signal
                 Model Parameters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "7",
  pages =        "1136--1150",
  month =        jul,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; array signal processing;
                 Confirmatory factor analysis; dereverberation; early
                 acoustic transfer functions; Estimation; joint
                 diagonalization; Mathematical model; microphone arrays;
                 microphone-self noise; Microphones; multimicrophone;
                 multimicrophone signal model parameters; Noise
                 measurement; parameter estimation; power spectral
                 densities; reverberation; Reverberation; robust method;
                 signal-model parameters; source separation; speech
                 enhancement; Time-frequency analysis; transfer",

  author =       "B. Cauchi and K. Siedenburg and J. F. Santos and T. H.
                 Falk and S. Doclo and S. Goetze",
  title =        "Non-Intrusive Speech Quality Prediction Using
                 Modulation Energies and {LSTM}-Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "7",
  pages =        "1151--1163",
  month =        jul,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic conditions; Acoustic measurements; Acoustics;
                 benchmark intrusive measures; clean speech signal;
                 intrusive measures; listening tests; long short-term
                 memory cells; LSTM-network; Modulation; modulation;
                 modulation energy; modulation energy features;
                 non-intrusive prediction; nonintrusive measures;
                 nonintrusive speech quality prediction; perceived
                 speech quality; perceptual measures; perceptual speech
                 quality; perceptually evaluated signals; Prediction
                 algorithms; recurrent neural nets; recurrent neural
                 network; reference signal; reverberation; signal
                 processing algorithms; Signal processing algorithms;
                 signal-based measures; speech enhancement; Speech
                 enhancement; speech enhancement algorithm settings;
                 speech enhancement algorithms; Speech quality",

  author =       "Y. Zhang and P. Zhang and Y. Yan",
  title =        "Tailoring an Interpretable Neural Language Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "7",
  pages =        "1164--1178",
  month =        jul,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "architectural structure; autoregressive moving
                 average; autoregressive moving average processes; CNNs;
                 component interpretability; convolutional neural nets;
                 convolutional neural networks; Feature extraction;
                 History; interpretability; interpretable neural
                 language model; language modeling datasets; language
                 modeling task; learning (artificial intelligence);
                 learning method; Mathematical model; Neural language
                 models; parameterized auto-regressive moving average
                 model; Penn Treebank; prediction interpretability;
                 Predictive models; recurrent neural nets; recurrent
                 neural networks; Recurrent neural networks; RNNs;
                 short-term memory LMs; speech recognition; switchboard
                 speech recognition task; Task analysis; typical neural
                 LMs; WikiText-2 datasets",

  author =       "A. Pandey and D. Wang",
  title =        "A New Framework for {CNN}-Based Speech Enhancement in
                 the Time Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "7",
  pages =        "1179--1188",
  month =        jul,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "CNN-based speech enhancement; Convolution;
                 convolutional neural nets; convolutional neural
                 network; Convolutional neural networks; deep learning;
                 Fourier transforms; frequency domain loss;
                 Frequency-domain analysis; fully convolutional neural
                 network; learning (artificial intelligence); mean
                 absolute error; mean absolute error loss; Noise
                 measurement; noisy utterance; short-time Fourier
                 transform magnitude; speech enhancement; Speech
                 enhancement; Task analysis; time domain; time domain
                 enhancement; Time-domain analysis; time-frequency",

  author =       "C. M. Vikram and N. Adiga and S. R. M. Prasanna",
  title =        "Detection of Nasalized Voiced Stops in Cleft Palate
                 Speech Using Epoch-Synchronous Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "7",
  pages =        "1189--1200",
  month =        jul,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "and velopharyngeal dysfunction; cepstral analysis;
                 Cleft palate; cleft palate speech; consonant-vowel
                 transitions; CP speech; Databases; epoch synchronous
                 features; epochs; feature extraction; Feature
                 extraction; glottal activity; hidden Markov models;
                 Mel-frequency cepstral coefficients; nasal consonants;
                 nasalized voiced stops; Production; single pole filter;
                 speech processing; Speech processing; speech
                 recognition; support vector machines; Surgery;
                 Time-frequency analysis; time-frequency",

  author =       "H. Luo and T. Li and B. Liu and B. Wang and H. Unger",
  title =        "Improving Aspect Term Extraction With Bidirectional
                 Dependency Tree Representation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "7",
  pages =        "1201--1212",
  month =        jul,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Aspect term extraction; aspect term extraction
                 problem; aspect-based sentiment analysis; benchmark
                 SemEval datasets; bidirectional dependency tree
                 network; bidirectional dependency tree representation;
                 BiLSTM plus CRF; bottom-up propagation; Browsers;
                 Computer architecture; dependency structure feature
                 extraction; dependency syntactic tree; dependency tree
                 structure representation; directional propagation;
                 embedded representations; end-to-end framework; Feature
                 extraction; feature extraction; learning (artificial
                 intelligence); Logic gates; natural language
                 processing; recursive neural network; sentiment
                 analysis; sequential features; Software; Syntactics;
                 Task analysis; top-down propagation; tree data
                 structures; tree-structured features",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "7",
  pages =        "C3--C3",
  month =        jul,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "C1--1213",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "C2--C2",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "1214--1215",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "T. Zhang and J. Wu",
  title =        "Constrained Learned Feature Extraction for Acoustic
                 Scene Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "1216--1228",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic scene classification; Acoustics; adaptive
                 machine learning; Computational modeling; constrained
                 learned feature extraction; convolutional neural
                 network; Deep neural networks; deep neural networks;
                 discrete Fourier transform; discrete Fourier
                 transforms; Discrete Fourier transforms; feature
                 extraction; Fourier transform; fully connected neural
                 network; graphics processing unit; Graphics processing
                 units; image classification; learning (artificial
                 intelligence); neural nets; Neural networks; recurrent
                 neural network; signal processing; signal processing
                 procedure; simulated Fourier transform module; Task
                 analysis; temporal transformer module",

  author =       "L. Gabrielli and S. Tomassetti and S. Squartini and C.
                 Zinato and S. Guaiana",
  title =        "A Multi-Stage Algorithm for Acoustic Physical Model
                 Parameters Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "1229--1240",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic physical model parameter estimation; acoustic
                 signal; acoustic signal processing; computational
                 acoustics; Computational modeling; computational sound
                 design; computational sound design approach; deep
                 learning approach; iterative optimization; learning
                 (artificial intelligence); Measurement; multistage
                 algorithm; musical acoustics; musical instruments;
                 Neural networks; neural networks; optimisation;
                 Parameter estimation; parameter estimation;
                 perceptually motivated objective cost functions;
                 Physics-based acoustic modeling; pipe organ tones;
                 sound design process time; stochastic optimization
                 method; Stochastic processes; stochastic processes;
                 Timbre; timbre matching; time to market",

  author =       "B. Yang and H. Liu and C. Pang and X. Li",
  title =        "Multiple Sound Source Counting and Localization Based
                 on {TF}-Wise Spatial Spectrum Clustering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "1241--1255",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal detection; acoustic signal processing;
                 adverse acoustic environments; correlation methods;
                 enhanced TF-wise spatial spectra; Histograms; iterative
                 methods; matrix algebra; microphone array recordings;
                 Microphone arrays; microphone arrays; multiple sound
                 source counting; multiple sound source localization;
                 pattern clustering; received sensor signals;
                 Reliability; remaining global spatial spectrum;
                 Reverberation; signal denoising; signal subspace;
                 Source counting; source detection; source presence
                 possibility; spatial correlation matrix; spatial
                 spectrum assignment; TF domain; TF-wise spatial
                 spectrum; TF-wise spatial spectrum clustering;
                 time-frequency analysis; Time-frequency analysis;
                 time-frequency wise spatial spectrum clustering based
                 method; unassigned spatial spectra",

  author =       "Y. Luo and N. Mesgarani",
  title =        "{Conv-TasNet}: Surpassing Ideal Time Frequency
                 Magnitude Masking for Speech Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "1256--1266",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Conv-TasNet system; Convolution; Decoding; Deep
                 learning; deep learning; deep learning framework;
                 end-to-end time-domain speech separation; fully
                 convolutional time-domain audio separation network;
                 ideal time-frequency magnitude masking; learning
                 (artificial intelligence); linear codes; linear
                 decoder; linear encoder; mixed signal; modified encoder
                 representations; objective distortion measures;
                 real-time; real-time speech separation applications;
                 real-world speech processing technologies; signal
                 representation; single-channel; single-channel
                 speaker-independent speech separation methods; Source
                 separation; source separation; speaker separation;
                 Spectrogram; spectrograms; speech coding; Speech
                 processing; speech separation systems; speech signal;
                 speech waveform; speech waveform representation;
                 stacked one-dimensional dilated convolutional blocks;
                 subjective quality assessment; temporal convolutional
                 network; three-speaker mixtures; time-domain;
                 Time-domain analysis; time-frequency analysis;
                 Time-frequency analysis; time-frequency representation;
                 two-speaker speech separation; weighting functions",

  author =       "A. K. Sarkar and Z. Tan and H. Tang and S. Shon and J.
                 Glass",
  title =        "Time-Contrastive Learning Based Deep Bottleneck
                 Features for Text-Dependent Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "1267--1279",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "automatic speech recognition systems; BN feature
                 extraction method; BN features; bottleneck feature;
                 brain; brain signals; brain states; cepstral analysis;
                 Clustering methods; deep bottleneck features; deep
                 neural networks; DNNs; DNNs discriminating speakers;
                 Feature extraction; feature extraction; fixed
                 pass-phrases; Gaussian processes; GMM-UBM; image
                 segmentation; learned features; learning (artificial
                 intelligence); Mel frequency cepstral coefficient;
                 multiframe segments; neural nets; nonstationarity
                 property; pattern clustering; Phonetics; segment-based
                 unsupervised clustering algorithm; short-time cepstral
                 features; speaker recognition; speaker verification;
                 speech data; speech frames; Speech recognition; speech
                 signals; speech utterance; TCL BN feature; TCL-BN;
                 TCL-DNNs; text-dependent speaker verification; time
                 contrastive learning concept; time-contrastive
                 features; time-contrastive learning; Training; training",

  author =       "J. Chua and W. B. Kleijn",
  title =        "A Low Latency Approach for Blind Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "1280--1294",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "blind source separation; Blind source separation; BSS
                 algorithms; Delays; demixing parameter estimation;
                 Estimation; long algorithmic delay; long analysis
                 window; low latency; low latency approach; Matrix
                 decomposition; microphones; Microphones; Microsoft
                 Windows; parameter estimation; separation performance;
                 subspace; time domain; Time-domain analysis;
                 time-frequency analysis; Time-frequency analysis;
                 time-frequency domain; traditional BSS approaches;
                 window length",

  author =       "C. Pan and J. Chen and J. Benesty and G. Shi",
  title =        "On the Design of Target Beampatterns for Differential
                 Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "1295--1307",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic application; acoustic signal processing;
                 Acoustics; ADMM algorithm;
                 alternating-direction-method-of-multipliers algorithm;
                 array signal processing; Array signal processing; audio
                 application; classical target beampatterns;
                 differential beamformer; differential beamforming;
                 differential beamforming filter; differential
                 microphone arrays; Differential microphone arrays;
                 differential sound pressure field; effective
                 beampattern; microphone arrays; Microphone arrays;
                 optimisation; positive superposition theorem; Pressure
                 measurement; resulting beampattern; Roads; speech
                 application; Speech processing; target beampattern;
                 target DMA; useful DMA target beampatterns",

  author =       "A. M. Azmi and M. N. Almutery and H. A. Aboalsamh",
  title =        "Real-Word Errors in {Arabic} Texts: a Better Algorithm
                 for Detection and Correction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "1308--1320",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Arabic language; arabic OCR; Arabic text;
                 computational linguistics; confusion sets-a simple
                 approach; context-sensitive; context-sensitive errors;
                 correction phase; correctly spelled word; corrects
                 real-word errors; detection phase; Dictionaries;
                 dyslexic text; learning (artificial intelligence);
                 natural language processing; optical character
                 recognition; Optical character recognition software;
                 real-word error words; Real-word errors; semantic
                 errors; Semantics; Speech processing; spelling error;
                 statistical language model; stem n-gram; Syntactics;
                 Testing; text analysis; Training; typical spell
                 checkers",

  author =       "M. Korpusik and J. Glass",
  title =        "Deep Learning for Database Mapping and Asking
                 Clarification Questions in Dialogue Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "1321--1334",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "convolutional neural nets; convolutional neural
                 network; convolutional neural network models;
                 crowdsourcing; database mapping; Databases; deep
                 reinforcement learning; deep RL; dialogue system;
                 entropy; entropy-based methods; Games; hybrid RL model;
                 interactive systems; learning (artificial
                 intelligence); natural language interfaces; natural
                 language processing; natural language representations;
                 natural language user queries; Natural languages;
                 nutrition domain; query languages; query processing;
                 Reinforcement learning; RL agent; rule-based method;
                 semantic embedding; Semantics; Speech processing;
                 standard feature engineering; structured database
                 entries; Task analysis; text analysis; text mismatch",

  author =       "J. Pak and J. W. Shin",
  title =        "Sound Localization Based on Phase Difference
                 Enhancement Using Deep Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "1335--1345",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic generators; acoustic radiators; background
                 noise; classical sound source localization algorithms
                 degrades; clean source signal estimation; deep neural
                 networks; direction-of-arrival; Direction-of-arrival
                 estimation; direction-of-arrival estimation;
                 directional signals; DNN-based phase difference
                 enhancement; DoA estimation; dry source signal
                 estimation; end-fire directions; Estimation; estimation
                 theory; input interchannel phase differences;
                 interchannel phase difference; IPD enhancement;
                 Microphones; neural nets; Noise measurement;
                 reverberation; Reverberation; room impulse responses;
                 Sound source localization; Speech enhancement",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "8",
  pages =        "C3--C3",
  month =        aug,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "R. Ali and G. Bernardi and T. {van Waterschoot} and M.
                 Moonen",
  title =        "Methods of Extending a Generalized Sidelobe Canceller
                 With External Microphones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "9",
  pages =        "1349--1364",
  month =        sep,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "beamforming; blocking matrix; eigenvalues and
                 eigenfunctions; External Microphone; GSC; GSC-LMA;
                 LMA-based generalized sidelobe canceller; local
                 microphone array; matrix algebra; Microphone arrays;
                 microphone arrays; microphone spacings;
                 Multi-Microphone Noise Reduction; Noise reduction;
                 noise reduction; rank-1 generalized eigenvalue
                 decomposition; relative transfer function; Speech
                 Enhancement; speech enhancement; Speech enhancement;
                 speech enhancement; speech estimate; Wireless
                 communication; Wireless sensor networks",

  author =       "X. Li and L. Girin and S. Gannot and R. Horaud",
  title =        "Multichannel Online Dereverberation Based on Spectral
                 Magnitude Inverse Filtering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "9",
  pages =        "1365--1377",
  month =        sep,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Adaptation models; channel identification;
                 complex-valued CTF convolution model; Convolution;
                 convolutive transfer function; cross-relation method;
                 filtering theory; Fourier transforms; gradient descent
                 criterion; gradient methods; Indexes; inverse
                 filtering; inverse filters; least squares
                 approximations; microphones; Microphones; multichannel
                 CTF; multichannel equalization; multichannel online
                 dereverberation; multiple-input/output inverse theorem;
                 nonnegative convolution model; Online speech
                 dereverberation; online STFT magnitude inverse
                 filtering method; recursive least square criterion;
                 Reverberation; reverberation; short-time Fourier
                 transform domain; spectral magnitude inverse filtering;
                 speech enhancement; Speech processing; speech
                 recognition; STFT domain; time-domain analysis;
                 Time-domain analysis; time-domain room impulse
                 response",

  author =       "L. Chen and Z. Chen and B. Tan and S. Long and M.
                 Ga{\v{s}}i{\'c} and K. Yu",
  title =        "{AgentGraph}: Toward Universal Dialogue Management
                 With Structured Deep Reinforcement Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "9",
  pages =        "1378--1391",
  month =        sep,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "AgentGraph framework; AgentGraph models; Computational
                 modeling; deep models; deep reinforcement learning;
                 dialogue domain ontology; Dialogue policy; DRL-based
                 algorithm; DRL-based policies; dual GNN-based dialogue
                 policy; GNN based architecture; graph neural network
                 based architecture; graph neural networks; graph
                 theory; high-level global decision; interactive
                 systems; learning (artificial intelligence); low-level
                 local decision; multi-agent systems; multiagent
                 reinforcement learning; neural nets; Neural networks;
                 Ontologies; ontologies (artificial intelligence);
                 Optimization; policy adaptation; policy optimization;
                 policy transfer; PyDial benchmark; Reinforcement
                 learning; structured deep reinforcement learning; Task
                 analysis; task-oriented spoken dialogue systems;
                 Training; transfer learning; universal dialogue
                 management",

  author =       "L. Li and J. Wang and J. Li and Q. Ma and J. Wei",
  title =        "Relation Classification via Keyword-Attentive Sentence
                 Mechanism and Synthetic Stimulation Loss",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "9",
  pages =        "1392--1404",
  month =        sep,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Adaptation models; attention mechanism; attention
                 mechanisms; bidirectional gated recurrent unit; BiGRU;
                 Feature extraction; imbalanced classification;
                 imbalanced classification problem; Kernel;
                 keyword-attentive sentence mechanism; learning
                 (artificial intelligence); loss function; mutual
                 learning; natural language processing; Neural networks;
                 pattern classification; Relation classification;
                 relation classification; Semantics; SemEval-2010 Task 8
                 data set; shortest dependency path; SSL-KAS-MuBiGRU;
                 Syntactics; synthetic stimulation loss; TAC40 data set;
                 Task analysis",

  author =       "M. B. M{\o}ller and J. K. Nielsen and E.
                 Fernandez-Grande and S. K. Olesen",
  title =        "On the Influence of Transfer Function Noise on Sound
                 Zone Control in a Room",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "9",
  pages =        "1405--1418",
  month =        sep,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic field; acoustic leakage; Acoustic
                 measurements; acoustic separation; acoustic signal
                 processing; Acoustics; active eigenfunctions; audio
                 signal processing; frequency 20.0 Hz to 300.0 Hz;
                 headphones; high separation; in situ transfer function
                 measurements; individual audio content; inherent noise;
                 loudspeakers; Loudspeakers; measurement noise;
                 microphones; Microphones; multiple loudspeakers;
                 multiple people; Noise measurement; personal audio;
                 rectangular room; Sensitivity; sound field control;
                 sound reproduction; sound zone control; sound zone
                 methods; Sound zones; target sound field; transfer
                 function noise; Transfer functions; transfer
                 functions",

  author =       "Z. Xu and C. Sun and Y. Long and B. Liu and B. Wang
                 and M. Wang and M. Zhang and X. Wang",
  title =        "Dynamic Working Memory for Context-Aware Response
                 Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "9",
  pages =        "1419--1431",
  month =        sep,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Context modeling; context representation;
                 context-aware response generation; contextual
                 utterances; conversation context modeling;
                 conversational agents; customer services; Decoding;
                 deep learning; dialog context; dynamic working memory
                 mechanism; encoder-decoder architecture; History; human
                 evaluation; human-to-human conversations; interactive
                 programming; interactive systems; Memory management;
                 Memory modules; OpenSubtitles Corpus; Response
                 generation; semantic interactions; Semantics; social
                 networking (online); Speech processing; Twitter
                 customer service corpus; ubiquitous computing",

  author =       "H. Kameoka and T. Kaneko and K. Tanaka and N. Hojo",
  title =        "{ACVAE-VC}: Non-Parallel Voice Conversion With
                 Auxiliary Classifier Variational Autoencoder",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "9",
  pages =        "1432--1443",
  month =        sep,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic feature sequences; Acoustics; ACVAE-VC;
                 Artificial neural networks; attribute class label
                 input; auxiliary classifier VAE; auxiliary classifier
                 VAE (ACVAE); auxiliary classifier variational
                 autoencoder; conditional variational autoencoder;
                 convolutional architectures; decoder output networks;
                 Decoding; decoding; fully convolutional network;
                 Gallium nitride; Generators; information-theoretic
                 regularization; learning (artificial intelligence);
                 non-parallel VC; nonparallel VC systems; nonparallel
                 voice conversion process; open-source parallel VC
                 system; regular conditional VAE; speaker identity
                 conversion task; speech coding; Speech recognition;
                 trained encoder; Training; variational autoencoder
                 (VAE); Voice conversion (VC)",

  author =       "X. Chen and X. Liu and Y. Wang and A. Ragni and J. H.
                 M. Wong and M. J. F. Gales",
  title =        "Exploiting Future Word Contexts in Neural Network
                 Language Models for Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "9",
  pages =        "1444--1454",
  month =        sep,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "bi-directional model; Computational modeling; Context
                 modeling; feedforward; feedforward unit; History;
                 keyword search; language model; language modeling;
                 Lattices; natural language processing; neural network
                 language model structure; probability; probability
                 distributions; recurrent neural nets; Recurrent neural
                 network; recurrent neural network LMs; Speech
                 processing; speech recognition; Speech recognition;
                 su-RNNLM; succeeding words; succeeding-word RNNLM;
                 Training; word lattices",

  author =       "R. Wang and Z. Chen and F. Yin",
  title =        "{DOA}-Based Three-Dimensional Node Geometry
                 Calibration in Acoustic Sensor Networks and Its
                 {Cram{\'e}r--Rao} Bound and Sensitivity Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "9",
  pages =        "1455--1468",
  month =        sep,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "3D rotation matrices; ABC algorithm; Acoustic sensor
                 network; acoustic sensor networks; artificial bee
                 colony algorithm; ASN geometry calibration;
                 calibration; Calibration; concave programming; Cost
                 function; Cram{\'e}r Rao bound; Cram{\'e}r-Rao bound;
                 direction of arrival; Direction-of-arrival estimation;
                 direction-of-arrival estimation; directional of arrival
                 measurements; DOA-based node geometry calibration;
                 DOA-based three-dimensional node geometry calibration;
                 Estimation; geometric structure; geometry; Geometry;
                 irregular geometric structures; matrix algebra;
                 microphones; Microphones; minimisation; node geometry
                 calibration; node geometry calibration method; node
                 geometry calibration problem; node geometry positions;
                 non-convex minimization; sensitivity analysis; sound
                 source position error; theoretical DOAs;
                 Three-dimensional displays; three-dimensional node
                 geometry calibration approach;
                 time-difference-of-arrival; tracking speakers; wireless
                 sensor networks",

  author =       "C. Lee and H. Lee and S. Wu and C. Liu and W. Fang and
                 J. Hsu and B. Tseng",
  title =        "Machine Comprehension of Spoken Content: {TOEFL}
                 Listening Test and Spoken {SQuAD}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "9",
  pages =        "1469--1480",
  month =        sep,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "academic English examination; attention model;
                 Cognition; computer aided instruction; deep learning;
                 English learners; Knowledge discovery; listening
                 comprehension task; listening comprehension test;
                 machine comprehension; native English speakers; natural
                 language processing; neural nets; second listening
                 comprehension task; Speech processing; Speech question
                 answering; speech recognition; Speech recognition;
                 spoken content; spoken SQuAD; SQuAD; Task analysis;
                 text content; TOEFL; Videos; Visualization",

  author =       "Y. Chen and S. Huang and H. Lee and Y. Wang and C.
                 Shen",
  title =        "Audio {Word2vec}: Sequence-to-Sequence Autoencoding
                 for Unsupervised Learning of Audio Segmentation and
                 Representation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "9",
  pages =        "1481--1493",
  month =        sep,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Acoustics; audio segmentation; audio signal
                 processing; Audio word2Vec; Decoding; natural language
                 processing; phonetic information; Phonetics; Recurrent
                 neural networks; reinforcement learning; SA vector
                 representations; segmental audio word2vec;
                 sequence-to-sequence autoencoder; sequence-to-sequence
                 autoencoding; signal representation; speaker
                 information; speech processing; Speech recognition;
                 Task analysis; Training; unannotated audio word2vec;
                 unsupervised learning; unsupervised spoken word
                 boundary segmentation; word level",

  author =       "P. Li and C. Chen and W. Zheng and Y. Deng and F. Ye
                 and Z. Zheng",
  title =        "{STD}: an Automatic Evaluation Metric for Machine
                 Translation Based on Word Embeddings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1497--1506",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Earth; earth mover's distance; embedded n-grams;
                 language translation; lexical-based metrics;
                 Linguistics; machine translation; Machine translation
                 evaluation; Measurement; metric; MT automatic
                 evaluation; n-gram; natural language processing; NIST;
                 semantic; semantic features; semantic relationships;
                 semantic travel distance; Semantics; Speech processing;
                 STD; Syntactics; word embeddings; word order",

  author =       "J. Zhang and R. Heusdens and R. C. Hendriks",
  title =        "Relative Acoustic Transfer Function Estimation in
                 Wireless Acoustic Sensor Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1507--1519",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic communication (telecommunication); audio
                 recording; audio recordings; bit rate; convex
                 optimization; convex programming; Correlation;
                 correlation methods; covariance analysis; Covariance
                 matrices; covariance subtraction; covariance
                 subtraction method; covariance whitening; covariance
                 whitening approach; CS-based methods; data records;
                 eigenvalues and eigenfunctions; estimated RTF accuracy;
                 Estimation; estimation performance; expected estimation
                 error; generalized eigenvalue decomposition; greedy
                 rate-distribution methods; matrix algebra; Matrix
                 decomposition; Microphones; minimisation; model-based
                 methods; model/data-driven rate distribution; Noise
                 measurement; noisy correlation matrix; numerical
                 analysis; numerical simulations; optimal rate
                 distributions; power usage; power usage minimization;
                 quantization; Quantization (signal); rate-distributed
                 CW methods; relative acoustic transfer function
                 estimation; relative transfer function; RTF estimation
                 accuracy; Sensor networks; telecommunication power
                 management; transfer functions; uniform rate
                 allocation; WASN; wireless acoustic sensor networks;
                 wireless sensor networks",

  author =       "J. Park and J. Chang",
  title =        "State-Space Microphone Array Nonlinear Acoustic Echo
                 Cancellation Using Multi-Microphone Near-End Speech
                 Covariance",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1520--1534",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Acoustic arrays; acoustic signal processing; acoustic
                 transfer function vector; approximation theory; array
                 signal processing; ATF vector estimation; echo
                 reduction; echo suppression; Eigenvalue decomposition;
                 Kalman filter; Kalman filters; linear acoustic path;
                 loudspeaker; loudspeakers; Low-rank approximation;
                 low-rank approximation; microphone array NAEC
                 algorithm; Microphone array nonlinear acoustic echo
                 cancellation; Microphone arrays; microphone arrays;
                 Multi-microphone near-end speech covariance;
                 multimicrophone near-end speech covariance;
                 multimicrophone Wiener filtering; near-end speech
                 quality; Nonlinear acoustics; nonlinear acoustics;
                 Parameterized multi-microphone Wiener filter; power
                 series; recursive estimation; residual echo;
                 reverberant condition; reverberation; SER; Signal
                 processing algorithms; signal-to-echo ratio;
                 single-microphone nonlinear AEC algorithm;
                 single-microphone-based model; Speech processing;
                 speech processing; state-space equation; state-space
                 methods; state-space microphone array nonlinear
                 acoustic echo cancellation; State-space modeling;
                 transfer functions; Wiener filters",

  author =       "Z. Luo and J. Chen and T. Takiguchi and Y. Ariki",
  title =        "Emotional Voice Conversion Using Dual Supervised
                 Adversarial Networks With Continuous Wavelet Transform
                 {F0} Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1535--1548",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic features; acoustic signal processing;
                 adaptive scales continuous wavelet transform; ADS-CWT
                 method; continuous wavelet transform F0 features;
                 Continuous wavelet transforms; dual supervised
                 adversarial networks; dual supervised learning; emotion
                 recognition; emotional VC experiments; emotional VC
                 task; Emotional voice conversion; emotional voice
                 conversion tasks; emotional voice representation;
                 feature extraction; generative adversarial networks;
                 Hidden Markov models; labeled emotional voice; learning
                 (artificial intelligence); low-level data space;
                 neutral voice; over-smoothing problem; prosodic
                 aspects; speech processing; Supervised learning; Task
                 analysis; temporal levels; Training; training
                 performance improvement; wavelet transform; wavelet
                 transforms",

  author =       "H. As'ad and M. Bouchard and H. Kamkar-Parsi",
  title =        "A Robust Target Linearly Constrained Minimum Variance
                 Beamformer With Spatial Cues Preservation for Binaural
                 Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1549--1563",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; anechoic propagation;
                 anechoic reverberant environments; array signal
                 processing; Array signal processing; background noise;
                 binaural beamforming algorithm; binaural cues
                 preservations; binaural hearing aids; complex realistic
                 acoustic scenarios; direction of arrival estimation;
                 direction-of-arrival estimation; Direction-of-arrival
                 estimation; directional interferers directions;
                 Estimation; Hearing aids; hearing aids; higher order
                 statistics; Microphones; mildly reverberant
                 environments; noise reduction; Noise reduction;
                 noise-only components; post-processor; propagation
                 model mismatch; reverberation; Robust LCMV; robust
                 target linearly constrained minimum variance
                 beamformer; robust TLCMV; second-order statistics;
                 simulated directional signals; spatial cues
                 preservation; speech processing; steering vector
                 mismatch; target distortion; target signal; target
                 speaker direction",

  author =       "Y. Wang and Y. Xia and L. Zhao and J. Bian and T. Qin
                 and E. Chen and T. Liu",
  title =        "Semi-Supervised Neural Machine Translation via
                 Marginal Distribution Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1564--1576",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Computational modeling; Data models; Decoding;
                 Mathematical model; natural language processing; Neural
                 machine translation; Neural networks; semi-supervised
                 learning; Task analysis; Training",

  author =       "A. Jati and P. Georgiou",
  title =        "Neural Predictive Coding Using Convolutional Neural
                 Networks Toward Unsupervised Learning of Speaker
                 Characteristics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1577--1589",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Convolutional Neural Networks (CNN); Neural networks;
                 Predictive coding; siamese network; Speaker
                 recognition; speaker recognition; Speaker-specific
                 characteristics; Speech processing; Speech recognition;
                 Task analysis; Training; unsupervised learning",

  author =       "F. Fontana and E. Bozzo",
  title =        "{Newton--Raphson} Solution of Nonlinear Delay-Free
                 Loop Filter Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1590--1600",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "basin of convergence; Computational modeling;
                 Convergence; Digital delay-free loop; diode clipper;
                 Integrated circuit modeling; Mathematical model;
                 Modulation; Newton method; Newton-Raphson method;
                 nonlinear filter network; ring modulator; Tools;
                 virtual analogue",

  author =       "N. Makishima and S. Mogami and N. Takamune and D.
                 Kitamura and H. Sumino and S. Takamichi and H.
                 Saruwatari and N. Ono",
  title =        "Independent Deeply Learned Matrix Analysis for
                 Determined Audio Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1601--1615",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Audio source separation; Covariance matrices; Data
                 models; deep neural networks; Estimation; independent
                 component analysis; Power capacitors; semi-supervised
                 learning; Source separation; Spectrogram;
                 Time-frequency analysis",

  author =       "J. J. Prakash and H. A. Murthy",
  title =        "Analysis of Inter-Pausal Units in {Indian} Languages
                 and Its Application to Text-to-Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1616--1628",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Databases; Gamma distribution; gamma distribution;
                 Hidden Markov models; Inter-pausal unit; IPU-based
                 TTSes; Machine learning; number of syllables; phrasing;
                 Speech processing; Syntactics; Training",

  author =       "Y. Lan and S. Wang and J. Jiang",
  title =        "Knowledge Base Question Answering With a
                 Matching-Aggregation Model and Question-Specific
                 Contextual Relations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1629--1638",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Artificial intelligence; Context modeling; knowledge
                 base question answering; Knowledge based systems;
                 Knowledge discovery; natural language processing;
                 Natural languages; Neural networks; Semantics; Task
                 analysis",

  author =       "X. Bai and H. Cao and K. Chen and T. Zhao",
  title =        "A Bilingual Adversarial Autoencoder for Unsupervised
                 Bilingual Lexicon Induction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1639--1648",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "bilingual lexicon induction; Computational modeling;
                 Correlation; Decoding; Dictionaries; Speech processing;
                 Training; Transforms; unsupervised word mapping; Word
                 embedding",

  author =       "G. Zhao and R. Gutierrez-Osuna",
  title =        "Using Phonetic Posteriorgram Based Frame Pairing for
                 Segmental Accent Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "10",
  pages =        "1649--1660",
  month =        oct,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Accent conversion; acoustic model; Acoustics;
                 Computational modeling; Phonetics; posteriorgram;
                 Signal processing algorithms; Speech processing;
                 Training; Trajectory; voice conversion",

  author =       "Z. Zhang and H. Zhao and K. Ling and J. Li and Z. Li
                 and S. He and G. Fu",
  title =        "Effective Subword Segmentation for Text
                 Comprehension",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "11",
  pages =        "1664--1674",
  month =        nov,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Linguistics; machine reading comprehension; Robot
                 sensing systems; Semantics; Speech processing; Subword
                 embedding; Task analysis; textual entailment; word
                 segmentation",

  author =       "Y. Xie and R. Liang and Z. Liang and C. Huang and C.
                 Zou and B. Schuller",
  title =        "Speech Emotion Classification Using Attention-Based
                 {LSTM}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "11",
  pages =        "1675--1685",
  month =        nov,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "attention mechanism; frame-level features; LSTM;
                 Speech emotion",

  author =       "S. Wang and Z. Huang and Y. Qian and K. Yu",
  title =        "Discriminative Neural Embedding Learning for
                 Short-Duration Text-Independent Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "11",
  pages =        "1686--1696",
  month =        nov,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Analytical models; angular softmax; center loss;
                 Feature extraction; Linear discriminant analysis;
                 Neural networks; Optimization; Short-duration
                 text-independent speaker verification; speaker neural
                 embedding; Speech processing; Training; triplet loss",

  author =       "R. Lu and Z. Duan and C. Zhang",
  title =        "Audio Visual Deep Clustering for Speech Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "11",
  pages =        "1697--1712",
  month =        nov,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "audio-visual fusion; deep clustering; Hidden Markov
                 models; Lips; Robustness; Speaker-independent speech
                 separation; Spectrogram; Speech processing; Training",

  author =       "N. Ueno and S. Koyama and H. Saruwatari",
  title =        "Three-Dimensional Sound Field Reproduction Based on
                 Weighted Mode-Matching Method",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "1852--1867",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic field; acoustic signal processing; array
                 geometries; directivities; exterior sound field
                 reproduction; Geometry; Harmonic analysis; interior
                 reproduction; loudspeakers; Loudspeakers; Minimization;
                 Mode-matching method; multizone reproduction; numerical
                 analysis; optimal driving signals; optimal weight;
                 reproduction accuracy; sound field reproduction; sound
                 field reproduction method; sound field synthesis; sound
                 reproduction; Speech processing; spherical wavefunction
                 expansion; Three-dimensional displays;
                 three-dimensional sound field reproduction; Two
                 dimensional displays; weighted mode-matching method",

  author =       "L. Wu and X. Tan and T. Qin and J. Lai and T. Liu",
  title =        "Beyond Error Propagation: Language Branching Also
                 Affects the Accuracy of Sequence Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "1868--1879",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "abstractive summarization; accuracy drop; accuracy
                 drop problem; autoregressive training; Decoding; error
                 propagation; error propagation problem; language
                 characteristic; language modeling; left-branching
                 language; Linguistics; Maximum likelihood estimation;
                 Measurement; natural language processing; neural
                 machine translation; Sequence generation; sequence
                 generation task; sequence generation tasks; Speech
                 processing; Task analysis; text analysis; Training",

  author =       "A. Das and J. Li and G. Ye and R. Zhao and Y. Gong",
  title =        "Advancing Acoustic-to-Word {CTC} Model With Attention
                 and Mixed-Units",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "1880--1892",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic-to-word; acoustic-to-word CTC model;
                 Acoustics; attention; attention modeling; complex
                 decoder; connectionist temporal classification
                 criterion; Context modeling; context weighted inputs;
                 CTC; CTC network; Data models; Decoding; E2E system;
                 end-to-end system; frequent words; frequently occurring
                 words; hard alignment issue; hybrid CTC; learning
                 (artificial intelligence); letter CTC; Microsoft
                 Cortana voice assistant task; mixed-unit CTC;
                 multiletter units; OOV; OOV issue; OOV words;
                 out-of-vocabulary issue; recurrent neural nets;
                 Recurrent neural networks; self-attention CTC; shared
                 hidden layers; speech coding; speech recognition;
                 Training; Training data; vanilla word CTC; vocabulary;
                 word error rate; word tagging; word-based CTC model",

  author =       "N. Antonello and E. {De Sena} and M. Moonen and P. A.
                 Naylor and T. {van Waterschoot}",
  title =        "Joint Acoustic Localization and Dereverberation
                 Through Plane Wave Decomposition and Sparse
                 Regularization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "1893--1905",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic model; acoustic signal processing; acoustic
                 source localization; Acoustics; Approximation
                 algorithms; dereverberated signals; Dereverberation;
                 diffuse noise; direction of arrival;
                 Direction-of-arrival estimation; direction-of-arrival
                 estimation; DOA; Estimation; first order optimization
                 algorithm; inverse problem; inverse problems; Inverse
                 problems; inverse problems; joint acoustic localization
                 and dereverberation; large-scale optimization problem;
                 localized noise; microphone positions; microphones;
                 Microphones; moving sound source; noise reduction;
                 optimisation; Optimization; plane wave decomposition;
                 reverberation; signal denoising; sound field; sound
                 pressure; source localization; source separation;
                 sparse regularization; sparse sensing; spatiospectral
                 sparsity; spectral analysis; speech processing; weight
                 signals; weighted overlap-add procedure",

  author =       "F. Borra and A. Bernardini and F. Antonacci and A.
                 Sarti",
  title =        "Uniform Linear Arrays of First-Order Steerable
                 Differential Microphones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "1906--1918",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "array signal processing; Array signal processing;
                 audio signal processing; Beamforming; beamforming
                 method; delay-and-sum beamformer; design methodologies;
                 differential microphones; directivity factor; filtering
                 layers; first-order steerable differential microphones;
                 FOSDMs; Geometry; microphone arrays; Microphone arrays;
                 Sensor arrays; single scalar parameter; spatial
                 filtering method; spatial filters; traditional spatial
                 filtering techniques; two-layer spatial filter; uniform
                 linear arrays; White noise; white noise; white noise
                 gain",

  author =       "L. Chai and J. Du and Q. Liu and C. Lee",
  title =        "Using Generalized {Gaussian} Distributions to Improve
                 Regression Error Modeling for Deep Learning-Based
                 Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "1919--1931",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "assumed homoscedastic Gaussian error model; clean
                 log-power spectral components; consistent improvements;
                 conventional DNN framework; conventional minimum;
                 conventional MMSE criterion; deep learning-based speech
                 enhancement; deep neural network; DNN input vectors;
                 DNN outputs; Gaussian distribution; Gaussian processes;
                 generalized Gaussian distribution; generalized Gaussian
                 distributions; GGD error model; heteroscedastic
                 properties; improved generalization; learning
                 (artificial intelligence); least mean squares methods;
                 Linear programming; maximum likelihood estimation;
                 maximum likelihood solution; mean square error methods;
                 ML criterion; ML optimization objective; neural nets;
                 noise; noisy LPS features; nonlinear regression deep
                 neural network-based speech enhancement; prediction
                 error modeling; prediction error vector; prediction
                 errors; Predictive models; regression analysis;
                 regression error modeling; robustness; speech
                 enhancement; Speech enhancement; speech processing;
                 squared error criterion; statistical analysis;
                 statistical perspective; statistically independent
                 random variables; super-Gaussian properties; Task
                 analysis; Training",

  author =       "J. Qi and J. Du and S. M. Siniscalchi and C. Lee",
  title =        "A Theory on Deep Neural Network Based Vector-to-Vector
                 Regression With an Illustration of Its Expressive Power
                 in Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "1932--1943",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "ANN structures; ANN-based regression function;
                 artificial neural network; Biological neural networks;
                 broader hidden layer; Computer architecture; deep
                 neural network; Deep neural network; deeper
                 architecture; expected clean speech; expressive power;
                 function approximation; functional approximation;
                 hidden layers; log power spectra; neural nets; Noise
                 measurement; noisy expected clean speech;
                 recently-emerged DNN based speech enhancement;
                 regression analysis; regression performance;
                 signal-to-noise-ratio levels; Speech enhancement;
                 speech enhancement; Task analysis; top hidden layer;
                 universal approximation; vector-to-vector regression;
                 vector-to-vector regression functions; vectors",

  author =       "X. Dang and Q. Cheng and H. Zhu",
  title =        "Indoor Multiple Sound Source Localization via
                 Multi-Dimensional Assignment Data Association",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "1944--1956",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "acoustic signal processing; Arrays; association costs;
                 data association; direction of arrival;
                 Direction-of-arrival estimation; direction-of-arrival
                 estimation; Estimation; false alarm-originated subsets;
                 false alarms; Feature extraction; indoor environments;
                 indoor multiple sound source localization; microphone
                 arrays; Microphone arrays; missed detections;
                 multidimensional assignment data association;
                 multidimensional assignment-based data association
                 approach; multiple microphone arrays; Multiple sound
                 source localization; multiple sound source localization
                 problem; multisource scenarios; optimal associations;
                 Position measurement; sensor fusion; source-originated
                 DOA estimates; target tracking",

  author =       "M. Schneider and E. A. P. Habets",
  title =        "Iterative {DFT}-Domain Inverse Filter Optimization
                 Using a Weighted Least-Squares Criterion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "1957--1969",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "approximation algorithms; Digital filters; discrete
                 Fourier transform domain; discrete Fourier transforms;
                 Discrete Fourier transforms; effective regularization
                 method; finite impulse response filters; Finite impulse
                 response filters; FIR filters; frequency-domain
                 analysis; Frequency-domain analysis; frequency-domain
                 weight; iterative DFT-domain inverse filter
                 optimization; iterative methods; jointly optimized
                 filter coefficients; least squares approximation; least
                 squares approximations; least-squares-optimal filter
                 coefficients; Mathematical model; optimisation;
                 Optimization; regularization parameters; sound-zones
                 scenario; Speech processing; Time-domain analysis;
                 time-domain analysis; time-domain filter coefficients;
                 time-domain weights; weighted least-squares criterion",

  author =       "K. Chen and R. Wang and M. Utiyama and E. Sumita and
                 T. Zhao",
  title =        "Neural Machine Translation With Sentence-Level Topic
                 Context",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "1970--1984",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Computer architecture; Context modeling; Convolution;
                 convolution neural network; convolutional neural nets;
                 Convolutional Neural Network; Decoding;
                 English-to-German translation tasks; Feature
                 extraction; language translation; Latent Topic
                 Representation; latent topic representations; LDC
                 Chinese-to-English translation tasks; natural language
                 processing; Neural Machine Translation; neural machine
                 translation methods; Sentence-level Context;
                 sentence-level context; source sentence-level topic
                 context information; Speech processing; statistical
                 machine translation; target language translation; Task
                 analysis; topic attention; transformer-based NMT;
                 translation prediction; word-level context",

  author =       "A. Gomez-Alanis and A. M. Peinado and J. A. Gonzalez
                 and A. M. Gomez",
  title =        "A Gated Recurrent Convolutional Neural Network for
                 Robust Spoofing Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "1985--1999",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "anti-spoofing techniques; antispoofing system; ASV;
                 automatic speaker verification systems; clean
                 scenarios; Convolutional neural networks; deep feature
                 extractor; deep features; deep learning; Feature
                 extraction; feature extraction; gated recurrent
                 convolutional neural networks; input spectral features;
                 Logic gates; logical access attacks; logical scenarios;
                 Noise measurement; noise robustness; noisy conditions;
                 noisy environments; physical scenarios; recurrent
                 neural nets; robust spoofing detection; Robustness;
                 signal-to-noise masks; speaker recognition; speaker
                 verification; Speech processing; speech signals;
                 spoofing attacks; Spoofing detection; Training;
                 utterance-level embeddings",

  author =       "S. Feng and T. Lee",
  title =        "Exploiting Cross-Lingual Speaker and Phonetic
                 Diversity for Unsupervised Subword Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2000--2011",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic modeling; Acoustics; across-speaker triphone
                 minimal-pair; Adaptation models; automatic speech
                 recognition systems; Clustering algorithms;
                 cross-lingual speaker; deep neural networks; feature
                 learning; frame clustering; frame-level labels; Hidden
                 Markov models; high-quality frame labels; individual
                 target languages; learning (artificial intelligence);
                 low-resource languages; MTL-DNN; multi-task learning;
                 multilingual bottleneck features; multitask learning;
                 neural nets; out-of-domain ASR systems; out-of-domain
                 languages; phonetic diversity; resource-rich; robust
                 BNF representations; robust features; robust
                 frame-level feature representations; speaker
                 adaptation; Speech processing; speech recognition;
                 subword-level speech units; supervised DNN training;
                 target language; Task analysis; Training; training
                 data; training speech; transcribed speech data;
                 transcribed training data; unsupervised learning;
                 unsupervised subword modeling; untranscribed training
                 data; Zero resource",

  author =       "W. Li and N. F. Chen and S. M. Siniscalchi and C.
                 Lee",
  title =        "Improving Mispronunciation Detection of {Mandarin}
                 Tones for Non-Native Learners With Soft-Target Tone
                 Labels and {BLSTM}-Based Deep Tone Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2012--2024",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Acoustics; BLSTM-based verifiers; canonical tone
                 categories; Computer-assisted language learning (CALL);
                 computer-assisted pronunciation training (CAPT);
                 Context modeling; Data mining; deep learning; Feature
                 extraction; hard target labels; hard targets; Hidden
                 Markov models; L2 learners; language learners whose
                 first language; Mandarin lexical tones;
                 mispronunciation detection; natural language
                 processing; neural nets; non-native tone modeling and
                 mispronunciation detection; nonnative learners;
                 nonnative tone productions; pattern classification;
                 Production; segmental tone features; sequential context
                 information; short-term memory network; soft targets;
                 soft-target tone labels; speech processing; Speech
                 processing; speech recognition; tone posteriors;
                 tone-level co-articulation; train binary classifiers;
                 trained tone models",

  author =       "Q. Tu and H. Chen",
  title =        "On Mainlobe Orientation of the First- and Second-Order
                 Differential Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2025--2040",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal processing; Acoustics; array signal
                 processing; Differential microphone array; first order
                 DMA; first-order differential microphone arrays; fixed
                 endfire direction; Gain; lower-order differential
                 microphone arrays; mainlobe orientation; Microphone
                 arrays; microphone arrays; microphone mismatches;
                 second-order differential microphone arrays;
                 second-order DMA; Sensitivity; Speech processing;
                 Tolerance analysis; tolerance analysis",

  author =       "J. Chorowski and R. J. Weiss and S. Bengio and A. {van
                 den Oord}",
  title =        "Unsupervised Speech Representation Learning Using
                 {WaveNet} Autoencoders",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2041--2053",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal processing; acoustic unit discovery;
                 Autoencoder; autoencoder models; autoencoding neural
                 networks; Decoding; discrete vector quantized VAE;
                 Feature extraction; Gaussian processes; Gaussian
                 variational autoencoder; high capacity WaveNet decoder;
                 high level semantic content; latent representation;
                 latent representations; learning (artificial
                 intelligence); low level details; neural nets; Neural
                 networks; phoneme identities; phonetic content;
                 Phonetics; pitch contour; Prototypes; simple
                 dimensionality reduction bottleneck; speech processing;
                 Speech processing; speech representation learning;
                 speech waveforms; Task analysis; unsupervised
                 extraction; unsupervised learning; unsupervised speech
                 representation; vector quantisation; VQ-VAE; WaveNet
                 autoencoders; ZeroSpeech 2017 unsupervised acoustic
                 unit discovery task",

  author =       "V. Varanasi and A. Agarwal and R. M. Hegde",
  title =        "Near-Field Acoustic Source Localization Using
                 Spherical Harmonic Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2054--2066",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal processing; Acoustics; Array signal
                 processing; array signal processing; beamforming;
                 convolutional neural nets; convolutional neural
                 network; direction independent features; direction of
                 arrival estimation; Direction-of-arrival estimation;
                 direction-of-arrival estimation; Estimation; Feature
                 extraction; Harmonic analysis; interpolation; learning
                 (artificial intelligence); learning-based framework;
                 Microphones; near-field acoustic source localization;
                 Near-field beamforming; near-field DOA estimation;
                 pressure distribution; range estimation; reverberant
                 conditions; Root mean square error; signal invariant
                 features; source signal strength; spatial pressure
                 interpolation; spherical harmonic domain; spherical
                 harmonic features; spherical microphone array; voice
                 activity detection; voicing activity detection;
                 Wigner-D functions",

  author =       "Y. Zheng and J. Tao and Z. Wen and J. Yi",
  title =        "Forward Backward Decoding Sequence for Regularizing
                 End-to-End {TTS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2067--2079",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Acoustics; Decoding; decoding; directional models;
                 divergence regularization terms; encoder-decoder with
                 attention; end-to-end; English; Forward-backward;
                 forward-backward decoding sequence; joint training
                 method; joint-training; learning (artificial
                 intelligence); Linguistics; Mandarin; model training;
                 regularization; regularizing end-to-end TTS;
                 regularizing neural end-to-end TTS; speech coding;
                 Speech processing; Speech recognition; speech
                 synthesis; Tacotron; target generation; Training; TTS",

  author =       "Y. Tu and J. Du and C. Lee",
  title =        "Speech Enhancement Based on Teacher Student Deep
                 Learning Using Improved Speech Presence Probability for
                 Noise-Robust Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2080--2091",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Adaptation models; BGRU-equipped student model;
                 bidirectional gated recurrent units; causal processing
                 mode; CHiME-4 challenge task; complex noncausal teacher
                 model; Computational modeling; deep learning based
                 speech enhancement; deep neural network; error
                 statistics; IMCRA; improved minima controlled recursive
                 averaging; improved speech presence probability;
                 IRM-based deep learning method; learning (artificial
                 intelligence); neural nets; noise; Noise measurement;
                 noise-robust speech recognition; nonlinear
                 interactions; online noise tracking; ratio masks;
                 regression-based enhancement model; relative WER
                 reduction; speech enhancement; Speech enhancement;
                 Speech recognition; speech
                 recognition; teacher-student deep learning;
                 Teacher-student learning; Training; word error rate",

  author =       "Y. Liu and D. Wang",
  title =        "Divide and Conquer: A Deep {CASA} Approach to
                 Talker-Independent Monaural Speaker Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2092--2102",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "acoustic signal processing; audio databases;
                 computational auditory scene analysis; deep CASA; deep
                 CASA approach; deep learning; Deep learning; divide and
                 conquer; divide and conquer methods; frame-level
                 separated spectra; frame-level separation; Image
                 analysis; Indexes; learning (artificial intelligence);
                 Monaural speech separation; multispeaker separation
                 task; neural nets; Neural networks; Noise measurement;
                 optimisation; pattern clustering;
                 permutation-invariantly trained neural network;
                 sequential grouping; simultaneous grouping; speaker
                 recognition; speaker separation; speaker tracking;
                 speech processing; Speech processing;
                 talker-independent monaural speaker separation;
                 Training; WSJ0-2mix database",

  author =       "X. Liu and D. F. Wong and L. S. Chao and Y. Liu",
  title =        "Latent Attribute Based Hierarchical Decoder for Neural
                 Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2103--2112",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "attribute level; Computational modeling; Decoding;
                 decoding; decoding process; decoding time; dynamic
                 hierarchical decoder; English-German translation tasks;
                 hierarchical decoder; language translation; Latent
                 attribute; latent attribute vectors; learning
                 (artificial intelligence); limited vocabulary;
                 linguistic attributes; Linguistics; natural language
                 processing; neural machine translation; neural machine
                 translation (NMT); NMT baselines; Semantics; Speech
                 processing; target word; Training; translation quality;
                 Vocabulary; word vector",

  author =       "J. Hu and N. Chen",
  title =        "Enhanced Feature Summarizing for Effective Cover Song
                 Identification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2113--2126",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Acoustic measurements; audio signal processing;
                 combined representative feature; cover song
                 identification; Cover Song Identification (CSI);
                 cross-similarity calculating stage; cross-similarity
                 calculating strategies; Feature extraction; feature
                 extraction; feature subsequence community; Feature
                 Summarizing; feature summarizing stage; gene-function
                 prediction accuracy; Hubness Reduction (HR); Hubness
                 Reduction strategy; Hubness' phenomenon; identification
                 accuracy; information retrieval; melody
                 perception-based similarity; memory efficiency; music;
                 Music; Network Enhancement (NE); Network Enhancement
                 technique; Noise measurement; performance enhancement;
                 retrieval effectiveness; self-similarity analysis-based
                 feature; Self-Similarity Matrix (SSM); self-similarity
                 network; Speech processing; statistical analysis; SuCo
                 model; summarized representative feature subsequences;
                 Thumb; unsummarized feature sequence",

  author =       "Q. Ma and L. Yu and S. Tian and E. Chen and W. W. Y.
                 Ng",
  title =        "Global-Local Mutual Attention Model for Text
                 Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2127--2139",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Computational modeling; Convolutional Neural Network
                 (CNN); discriminative features; feature extraction;
                 Feature extraction; global long-term dependencies;
                 global-guided local-attention; global-local mutual
                 attention model; informative features; key local
                 semantic information; learning (artificial
                 intelligence); local-guided global-attention; mutual
                 attention mechanism; Mutual Attention Mechanism; mutual
                 attention weights; mutual learning; natural language
                 processing; Natural language processing; pattern
                 classification; Recurrent Neural Network (RNN);
                 Recurrent neural networks; relevant local semantic
                 features; Semantics; Task analysis; text analysis; Text
                 Classification; text classification problems;
                 Visualization; Weighted-over-time Pooling;
                 weighted-over-time pooling operation",

  author =       "V. V{\"a}lim{\"a}ki and J. R{\"a}m{\"o}",
  title =        "Neurally Controlled Graphic Equalizer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2140--2149",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Audio systems; Bandwidth; equalisers; Equalizers;
                 equalizers; feedforward neural nets; feedforward neural
                 network based method; feedforward neural networks;
                 filter gain control; filtering theory; Gain; gain
                 control; Graphics; IIR filters; learning (artificial
                 intelligence); least-square design method; matrix
                 inversion; music processing applications; neurally
                 controlled graphic equalizer; neurocontrollers; noise
                 figure 0.1 dB; Optimization; optimized band filter gain
                 coefficients; Speech processing; supervised learning;
                 telecommunication control; ten-octave graphic
                 equalization design; time-varying equalization",

  author =       "S. U. N. Wood and J. K. W. Stahl and P. Mowlaee",
  title =        "Binaural Codebook-Based Speech Enhancement With Atomic
                 Speech Presence Probability",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2150--2161",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "ASPP estimators; ASPP-based speech enhancement
                 algorithms; atomic speech presence probability;
                 binaural codebook-based speech enhancement; binaural
                 cue preservation; binaural cues; binaural mixtures;
                 binaural noise reduction; Binaural speech enhancement;
                 binaural speech enhancement benchmark methods; binaural
                 STOI metrics; Estimation; given codebook atom; Indexes;
                 interaural coherence magnitude; interaural phase;
                 interaural transfer function; ITF-based ASPP approach;
                 level difference; Noise measurement; Noise reduction;
                 nonnegative matrix factorization; objective speech
                 quality; PESQ metrics; probability; reverberant speech;
                 reverberation; signal denoising; single codebook;
                 speech coding; Speech coding; Speech enhancement;
                 speech enhancement; speech intelligibility; transfer
                 functions; universal codebook-based speech enhancement
                 framework",

  author =       "L. Pfeifenberger and M. Z{\"o}hrer and F. Pernkopf",
  title =        "Eigenvector-Based Speech Mask Estimation for
                 Multi-Channel Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2162--2172",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Acoustics; Array signal processing; array signal
                 processing; CHiME4 corpora; Direction-of-arrival
                 estimation; eigennet architecture; eigenvalues and
                 eigenfunctions; Eigenvector beamforming; eigenvector
                 features; eigenvector-based speech mask estimation;
                 estimation theory; filtering theory; generalized
                 eigenvalue beamformers; GEV; Kaldi speech-to-text API;
                 microphones; Microphones; minimum variance
                 distortionless response; Multi-channel speech
                 enhancement; multichannel microphone observations;
                 multichannel speech enhancement; MVDR; Neural Networks;
                 Noise measurement; PAN postfilter; phase aware
                 normalization postfilter; Signal to noise ratio; SNR;
                 Speech enhancement; speech enhancement; speech mask
                 estimation; WER; word error rate; WSJ0 corpora",

  author =       "M. Arnela and S. Dabbaghchian and O. Guasch and O.
                 Engwall",
  title =        "{MRI}-Based Vocal Tract Representations for the
                 Three-Dimensional Finite Element Synthesis of
                 Diphthongs",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2173--2182",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "3D dynamic vocal tract representations; acoustic wave
                 propagation; acoustic waves; adaptive grid; adjacent
                 cross-sections; Au; biomedical MRI; cross-section
                 orientations; diphthongs; finite element analysis;
                 Finite element analysis; Finite Element Method;
                 Geometry; Interpolation; magnetic resonance imaging;
                 Magnetic resonance imaging; mixed wave equation;
                 MRI-based vocal tract geometries; MRI-based vocal tract
                 representations; semi-polar grid; semi-polar grid
                 strategy; Shape; Solid modeling; spatial resolution;
                 speech; speech processing; speech synthesis; SPG
                 dynamic vocal tract representation; static sounds;
                 static vowel sounds; Three-dimensional displays;
                 three-dimensional finite element synthesis; Vocal tract
                 acoustics; vocal tract midline; wave equations",

  author =       "K. Sekiguchi and Y. Bando and A. A. Nugraha and K.
                 Yoshii and T. Kawahara",
  title =        "Semi-Supervised Multichannel Speech Enhancement With a
                 Deep Speech Prior",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2197--2212",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Data models; deep learning; Maximum likelihood
                 estimation; Multichannel speech enhancement; Noise
                 measurement; nonnegative matrix factorization;
                 Probabilistic logic; Speech enhancement; Time-frequency
                 analysis; variational autoencoder",

  author =       "Q. Guo and X. Qiu and X. Xue and Z. Zhang",
  title =        "Low-Rank and Locality Constrained Self-Attention for
                 Sequence Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2213--2222",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Bit error rate; Data models; deep learning;
                 Linguistics; Matrix decomposition; Natural language
                 processing; self-attention; Sequence modeling; Sparse
                 matrices; Task analysis; transformer",

  author =       "J. Yu and Q. Ling and C. Luo and C. W. Chen",
  title =        "Synthesizing {$3$D} {Trump}: Predicting and
                 Visualizing the Relationship Between Text, Speech, and
                 Articulatory Movements",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2223--2233",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";
  keywords =     "Acoustics; Animation; Feature extraction; Head;
                 Linguistics; speech animation; Three-dimensional
                 displays; Visual co-articulation; Visualization",

  author =       "R. Sugiura and Y. Kamamoto and T. Moriya",
  title =        "Shape Control of Discrete Generalized {Gaussian}
                 Distributions for Frequency-Domain Audio Coding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2234--2248",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Audio compression; Computational modeling; entropy
                 coding; generalized Gaussian distribution; Laplace
                 equations; Psychoacoustic models; Shape; Speech coding;
                 Speech processing",

  author =       "Z. Ben-Hur and D. L. Alon and R. Mehra and B.
                 Rafaely",
  title =        "Efficient Representation and Sparse Sampling of
                 Head-Related Transfer Functions Using Phase-Correction
                 Based on Ear Alignment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2249--2262",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Ear; Finite wordlength effects; Frequency-domain
                 analysis; head-related transfer functions (HRTFs);
                 Interpolation; Spatial audio; Spatial resolution;
                 Speech processing; spherical-harmonics; Transfer
                 functions",

  author =       "L. Remaggi and P. J. B. Jackson and W. Wang",
  title =        "Modeling the Comb Filter Effect and Interaural
                 Coherence for Binaural Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2263--2277",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "binaural audio; Coherence; comb filter effect; ILD;
                 Integrated circuit modeling; interaural coherence; IPD;
                 multipath propagation; Reverberation; RIRs; Source
                 separation; Speech processing",

  author =       "B. Zhang and D. Xiong and J. Su and J. Luo",
  title =        "Future-Aware Knowledge Distillation for Neural Machine
                 Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2278--2287",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Computational modeling; Context modeling; Decoding;
                 Future context; History; knowledge distillation;
                 natural language processing; neural machine
                 translation; Predictive models; Semantics; Training",

  author =       "R. Ali and T. {Van Waterschoot} and M. Moonen",
  title =        "Integration of a Priori and Estimated Constraints Into
                 an {MVDR} Beamformer for Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2288--2300",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Acoustic distortion; Acoustics; Beamforming;
                 Correlation; Microphone arrays; Minimum Variance
                 Distortionless Response (MVDR) Beamformer;
                 Multi-Microphone Noise Reduction; Speech Enhancement;
                 Speech enhancement; Tuning",

  author =       "N. Tiwari and P. C. Pandey",
  title =        "Speech Enhancement Using Noise Estimation With Dynamic
                 Quantile Tracking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2301--2312",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Dynamic quantile tracking; Estimation; hearing aids;
                 Indexes; Microsoft Windows; noise estimation; Noise
                 measurement; Smoothing methods; speech communication
                 devices; speech enhancement; Speech enhancement",

  author =       "J. Duan and X. Ding and Y. Zhang and T. Liu",
  title =        "{TEND}: A Target-Dependent Representation Learning
                 Framework for News Document",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2313--2325",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Document Representation; Internet; Logic gates; Neural
                 networks; Speech processing; Stance Detection; Stock
                 Market Prediction; Target-dependent Representation;
                 Task analysis; Text mining; Twitter",

  author =       "L. Zhao and X. Qiu and Q. Zhang and X. Huang",
  title =        "Sequence Labeling With Deep Gated Dual Path {CNN}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2326--2335",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Context modeling; convolutional neural networks;
                 Hidden Markov models; Labeling; Logic gates; Natural
                 language processing; recurrent neural networks;
                 Recurrent neural networks; Sequence labeling; Task
                 analysis",

  author =       "A. Kato and T. H. Kinnunen",
  title =        "Statistical Regression Models for Noise Robust {F0}
                 Estimation Using Recurrent Deep Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2336--2349",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Estimation; F0; Fundamental frequency; Hidden Markov
                 models; Noise robustness; pitch; Recurrent neural
                 networks; recurrent neural networks; regression model;
                 Speech processing; Task analysis; waveform-to-sinusoid
                 regression",

  author =       "D. Liu and J. Fu and Q. Qu and J. Lv",
  title =        "{BFGAN}: Backward and Forward Generative Adversarial
                 Networks for Lexically Constrained Sentence
                 Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2350--2361",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "Force; Gallium nitride; generative adversarial
                 networks; Generators; Lexically constrained sentence
                 generation; natural language generation; Natural
                 languages; Search problems; Task analysis; Training",

  author =       "A. Marafioti and N. Perraudin and N. Holighaus and P.
                 Majdak",
  title =        "A Context Encoder For Audio Inpainting",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2362--2372",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "frequency-domain analysis; Image reconstruction;
                 Instruments; machine learning; Music; Prediction
                 algorithms; Psychoacoustic models; Reliability; signal
                 processing algorithms; Time-domain analysis",

  author =       "J. Yang and R. K. Das and N. Zhou",
  title =        "Extraction of Octave Spectra Information for Spoofing
                 Attack Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "12",
  pages =        "2373--2384",
  month =        dec,
  year =         "2019",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Fri Nov 29 16:54:01 2019",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",
  keywords =     "constant-Q multi-level coefficients (CMC); Data
                 mining; Discrete cosine transforms; Feature extraction;
                 High frequency; Mel frequency cepstral coefficient;
                 Multi-level transform (MLT); replay speech detection;
                 synthetic speech detection",

  author =       "Jamal Amini and Richard Christian Hendriks and Richard
                 Heusdens and Meng Guo and Jesper Jensen",
  title =        "Rate-Constrained Noise Reduction in Wireless Acoustic
                 Sensor Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "1--12",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Wireless acoustic sensor networks (WASNs) can be used
                 for centralized multi-microphone noise reduction, where
                 the processing is done in a fusion center (FC). To
                 perform the noise reduction, the data needs to be
                 transmitted to the FC. Considering the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Chitralekha Gupta and Haizhou Li and Ye Wang",
  title =        "Automatic Leaderboard: Evaluation of Singing Quality
                 Without a Standard Reference",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "13--26",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatic evaluation of singing quality can be done
                 with the help of a reference singing or the digital
                 sheet music of the song. However, such a standard
                 reference is not always available. In this article, we
                 propose a framework to rank a large pool of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Sefik Emre Eskimez and Ross K. Maddox and Chenliang Xu
                 and Zhiyao Duan",
  title =        "Noise-Resilient Training Method for Face Landmark
                 Generation From Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "27--38",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Visual cues such as lip movements, when available,
                 play an important role in speech communication. They
                 are especially helpful for the hearing impaired
                 population or in noisy environments. When not
                 available, having a system to automatically generate
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Peidong Wang and Ke Tan and De Liang Wang",
  title =        "Bridging the Gap Between Monaural Speech Enhancement
                 and Recognition With Distortion-Independent Acoustic
                 Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "39--48",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Monaural speech enhancement has made dramatic advances
                 since the introduction of deep learning a few years
                 ago. Although enhanced speech has been demonstrated to
                 have better intelligibility and quality for human
                 listeners, feeding it directly to automatic \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Yuki Mitsufuji and Stefan Uhlich and Norihiro Takamune
                 and Daichi Kitamura and Shoichi Koyama and Hiroshi
                 Saruwatari",
  title =        "Multichannel Non-Negative Matrix Factorization Using
                 Banded Spatial Covariance Matrices in Wavenumber
                 Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "49--60",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Blind source separation exploiting multichannel
                 information has long been a popular topic, and recently
                 proposed methods based on the local Gaussian model have
                 shown promising results despite its high computational
                 cost for the case of many microphone \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Yaron Laufer and Sharon Gannot",
  title =        "Scoring-Based {ML} Estimation and {CRBs} for
                 Reverberation, Speech, and Noise {PSDs} in a Spatially
                 Homogeneous Noise Field",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "61--76",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Hands-free speech systems are subject to performance
                 degradation due to reverberation and noise. Common
                 methods for enhancing reverberant and noisy speech
                 require the knowledge of the speech, reverberation and
                 noise power spectral densities (PSDs). Most \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Naveen Kumar Desiraju and Simon Doclo and Markus Buck
                 and Tobias Wolff",
  title =        "Online Estimation of Reverberation Parameters For Late
                 Residual Echo Suppression",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "77--91",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "In hands-free telephony and other distant-talk
                 applications, often a short AEC filter is used to
                 achieve fast convergence at low computational cost. As
                 a result, a significant amount of late residual echo
                 (LRE) may remain, especially in highly reverberant
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Mehdi Zohourian and Rainer Martin",
  title =        "Binaural Direct-to-Reverberant Energy Ratio and
                 Speaker Distance Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "92--104",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "This article addresses the problem of distance
                 estimation using binaural hearing aid microphones in
                 reverberant rooms. Among several distance indicators,
                 the direct-to-reverberant energy ratio (DRR) has been
                 shown to be more effective than other features.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Youhyun Shin and Sang-goo Lee",
  title =        "Learning Context Using Segment-Level {LSTM} for Neural
                 Sequence Labeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "105--115",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "This article introduces an approach that learns
                 segment-level context for sequence labeling in natural
                 language processing (NLP). Previous approaches limit
                 their basic unit to a word for feature extraction
                 because sequence labeling is a token-level task
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Gongping Huang and Jingdong Chen and Jacob Benesty",
  title =        "Design of Planar Differential Microphone Arrays With
                 Fractional Orders",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "116--130",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Differential microphone arrays (DMAs) often encounter
                 white noise amplification, especially at low
                 frequencies. If the array geometry and the number of
                 microphones are fixed, one can improve the white noise
                 amplification problem by reducing the DMA order.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Ming-Hsiang Su and Chung-Hsien Wu and Liang-Yu Chen",
  title =        "Attention-Based Response Generation Using Parallel
                 Double {Q}-Learning for Dialog Policy Decision in a
                 Conversational System",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "131--143",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "This article proposes an approach to response
                 generation using a Parallel Double Q-learning algorithm
                 for dialog policy decision in a conversational system.
                 First, a new semantic representation of the
                 user's input sentence is presented by using
                 the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Satoru Emura",
  title =        "Wave-Domain Residual Echo Reduction Using Subspace
                 Tracking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "144--156",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "This article proposes a wave-domain residual echo
                 reduction method for two-way immersive sound
                 communication, which is based on wave field synthesis
                 and uses uniform linear arrays of loudspeakers and
                 microphones. This method is intended to improve the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Xin Wang and Shinji Takaki and Junichi Yamagishi and
                 Simon King and Keiichi Tokuda",
  title =        "A Vector Quantized Variational Autoencoder {(VQ-VAE)}
                 Autoregressive Neural {$ F_0 $} Model for Statistical
                 Parametric Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "157--170",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Recurrent neural networks (RNNs) can predict
                 fundamental frequency (F0) for statistical parametric
                 speech synthesis systems, given linguistic features as
                 input. However, these models assume conditional
                 independence between consecutive \ldots{}.",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Falk-Martin Hoffmann and Philip Arthur Nelson and
                 Filippo Maria Fazi",
  title =        "{DOA} Estimation Performance With Circular Arrays in
                 Sound Fields With Finite Rate of Innovation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "171--184",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "A novel Direction-of-Arrival (DOA) estimation method
                 based on a plane wave sound field model was recently
                 proposed for circular microphone arrays~[1]. This
                 article presents a detailed theoretical analysis of
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Rongfeng Su and Xunying Liu and Lan Wang and Jingzhou
                 Yang",
  title =        "Cross-Domain Deep Visual Feature Generation for
                 {Mandarin} Audio--Visual Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "185--197",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "There has been a long term interest in using visual
                 information to improve automatic speech recognition
                 (ASR) system performance. Both audio and visual
                 information are required in conventional audio visual
                 speech recognition (AVSR) systems. This limits
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Titouan Parcollet and Mohamed Morchid and Xavier Bost
                 and Georges Linar{\`e}s and Renato {De Mori}",
  title =        "Real to {H}-Space Autoencoders for Theme
                 Identification in Telephone Conversations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "198--210",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Machine learning (ML) and deep learning with deep
                 neural networks (DNN), have drastically improved the
                 performances of modern systems on numerous spoken
                 language understanding (SLU) related tasks. Since most
                 of current researches focus on new neural \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Antonio Canclini and Fabio Antonacci and Stefano
                 Tubaro and Augusto Sarti",
  title =        "A Methodology for the Robust Estimation of the
                 Radiation Pattern of Acoustic Sources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "211--224",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "We propose a novel methodology for estimating the
                 radiation pattern of acoustic sources, which is general
                 enough as to be suitable for a wide variety of sources
                 without the need of anechoic conditions of operation.
                 Multiple plenacoustic cameras (which can \ldots{}).",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Yi Yu and Hongsen He and Badong Chen and Jianghui Li
                 and Youwen Zhang and Lu Lu",
  title =        "{$M$}-Estimate Based Normalized Subband Adaptive
                 Filter Algorithm: Performance Analysis and
                 Improvements",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "225--239",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "This article studies the mean and mean-square
                 behaviors of the M-estimate based normalized subband
                 adaptive filter algorithm (M-NSAF) with robustness
                 against impulsive noise. Based on the
                 contaminated-Gaussian noise model, the stability
                 condition, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Hao-Xiang Wen and Sen-Quan Yang and Yuan-Quan Hong and
                 Huan Luo",
  title =        "A Partial Update Adaptive Algorithm for Sparse System
                 Identification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "240--255",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "A sparse partial update (SPU) algorithm and its
                 improved version improved SPU (ISPU) algorithm, are
                 proposed in this paper for sparse system
                 identification. The SPU first categorizes its filter
                 coefficients into active and inactive coefficients.
                 Then all \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Martin Bo M{\o}ller and Jan {\O}stergaard",
  title =        "A Moving Horizon Framework for Sound Zones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "256--265",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Sound zones are generated to provide independent audio
                 reproduction to multiple people in the same room using
                 loudspeakers. In this article, sound zones are
                 formulated in terms of a moving horizon framework. This
                 framework allows the reproduction scenario \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Stylianos Ioannis Mimilakis and Konstantinos Drossos
                 and Estefan{\'\i}a Cano and Gerald Schuller",
  title =        "Examining the Mapping Functions of Denoising
                 Autoencoders in Singing Voice Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "266--278",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "The goal of this article is to investigate what
                 singing voice separation approaches based on neural
                 networks learn from the data. We examine the mapping
                 functions of neural networks based on the denoising
                 autoencoder (DAE) model that are conditioned on
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lachlan I. Birnie and Thushara D. Abhayapala and
                 Prasanga N. Samarasinghe",
  title =        "Reflection Assisted Sound Source Localization Through
                 a Harmonic Domain {MUSIC} Framework",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "279--293",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "This work presents a method that persuades acoustic
                 reflections to be a favorable property for sound source
                 localization. Whilst most real world spatial audio
                 applications utilize prior knowledge of sound source
                 position, estimating such positions in \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wenhao Ding and Liang He",
  title =        "Adaptive Multi-Scale Detection of Acoustic Events",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "294--306",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "The goal of acoustic (or sound) events detection (AED
                 or SED) is to predict the temporal position of target
                 events in given audio segments. This task plays a
                 significant role in safety monitoring, acoustic early
                 warning and other scenarios. However, the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Weijian Zhang and Peng Song",
  title =        "Transfer Sparse Discriminant Subspace Learning for
                 Cross-Corpus Speech Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "307--318",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Cross-corpus speech emotion recognition has attracted
                 much attention due to the widespread existence of
                 various emotional speech in life. It takes one corpus
                 for training and another corpus for testing, and
                 generally involves the following two basic \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bidisha Sharma and Ye Wang",
  title =        "Automatic Evaluation of Song Intelligibility Using
                 Singing Adapted {STOI} and Vocal-Specific Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "319--331",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "An objective machine-driven measure of song
                 intelligibility would be of great utility for various
                 music information retrieval tasks. Song intelligibility
                 mostly depends on two factors, the amount of
                 interference caused by background accompaniment, and
                 the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hai Morgenstern and Boaz Rafaely",
  title =        "Perceptually-Transparent Online Estimation of
                 Two-Channel Room Transfer Function for Sound
                 Calibration",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "332--342",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Sound calibration is employed in many commercial audio
                 systems for improving sound quality. This process
                 includes the estimation of the room transfer function
                 (RTF) between each loudspeaker and a microphone located
                 at the listeners' position. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shaojin Ding and Guanlong Zhao and Christopher
                 Liberatore and Ricardo Gutierrez-Osuna",
  title =        "Learning Structured Sparse Representations for Voice
                 Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "343--354",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Sparse-coding techniques for voice conversion assume
                 that an utterance can be decomposed into a sparse code
                 that only carries linguistic contents, and a dictionary
                 of atoms that captures the speakers'
                 characteristics. However, conventional \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mireia Diez and Luk{\'a}{\v{s}} Burget and Federico
                 Landini and Jan {\v{C}}ernock{\'y}",
  title =        "Analysis of Speaker Diarization Based on {Bayesian}
                 {HMM} With Eigenvoice Priors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "355--368",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "In our previous work, we introduced our Bayesian
                 Hidden Markov Model with eigenvoice priors, which has
                 been recently recognized as the state-of-the-art model
                 for Speaker Diarization. In this article we present a
                 more complete analysis of the Diarization \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jia-Chen Gu and Zhen-Hua Ling and Quan Liu",
  title =        "Utterance-to-Utterance Interactive Matching Network
                 for Multi-Turn Response Selection in Retrieval-Based
                 Chatbots",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "369--379",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "This article proposes an utterance-to-utterance
                 interactive matching network (U2U-IMN) for multi-turn
                 response selection in retrieval-based chatbots.
                 Different from previous methods following
                 context-to-response matching or utterance-to-response
                 matching \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ke Tan and DeLiang Wang",
  title =        "Learning Complex Spectral Mapping With Gated
                 Convolutional Recurrent Networks for Monaural Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "380--390",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 15 09:50:40 MDT 2020",
  bibsource =    "",
  URL =          "",
  abstract =     "Phase is important for perceptual quality of speech.
                 However, it seems intractable to directly estimate
                 phase spectra through supervised learning due to their
                 lack of spectrotemporal structure in it. Complex
                 spectral mapping aims to estimate the real and
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Richeng Duan and Tatsuya Kawahara and Masatake
                 Dantsuji and Hiroaki Nanjo",
  title =        "Cross-Lingual Transfer Learning of Non-Native Acoustic
                 Modeling for Pronunciation Error Detection and
                 Diagnosis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "391--401",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In computer-assisted pronunciation training (CAPT),
                 the scarcity of large-scale non-native corpora and
                 human expert annotations are two fundamental challenges
                 to non-native acoustic modeling. Most existing
                 approaches of acoustic modeling in CAPT are based
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xin Wang and Shinji Takaki and Junichi Yamagishi",
  title =        "Neural Source-Filter Waveform Models for Statistical
                 Parametric Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "402--415",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Neural waveform models have demonstrated better
                 performance than conventional vocoders for statistical
                 parametric speech synthesis. One of the best models,
                 called WaveNet, uses an autoregressive (AR) approach to
                 model the distribution of waveform sampling \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sanjeel Parekh and Slim Essid and Alexey Ozerov and
                 Ngoc Q. K. Duong and Patrick P{\'e}rez and Ga{\"e}l
                 Richard",
  title =        "Weakly Supervised Representation Learning for
                 Audio-Visual Scene Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "416--428",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Audio-visual (AV) representation learning is an
                 important task from the perspective of designing
                 machines with the ability to understand complex events.
                 To this end, we propose a novel multimodal framework
                 that instantiates multiple instance learning.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jianfei Yu and Jing Jiang and Rui Xia",
  title =        "Entity-Sensitive Attention and Fusion Network for
                 Entity-Level Multimodal Sentiment Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "429--439",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Entity-level (aka target-dependent) sentiment analysis
                 of social media posts has recently attracted increasing
                 attention, and its goal is to predict the sentiment
                 orientations over individual target entities mentioned
                 in users' posts. Most existing \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "John G. Beerends and Niels M. P. Neumann and Egon L.
                 van den Broek and Anna Llagostera Casanovas and Jovana
                 Torres Menendez and Christian Schmidmer and Jens
                 Berger",
  title =        "Subjective and Objective Assessment of Full Bandwidth
                 Speech Quality",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "440--449",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "With the introduction of fullband speech coding the
                 question arises what role frequency components above
                 14~kHz play in speech quality assessment. On
                 the one hand, our results show that bandwidth
                 limitation from 24~kHz down to 14~kHz
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Vikram C. Mathad and S. R. Mahadeva Prasanna",
  title =        "Vowel Onset Point Based Screening of Misarticulated
                 Stops in Cleft Lip and Palate Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "450--460",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "The presence of velopharyngeal dysfunction, dental
                 occlusion, and mislearned articulation in individuals
                 with cleft lip and palate (CLP) results in the
                 production of misarticulated stop consonants. The
                 present work considers vowel onset points (VOPs) as
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Minh Nguyen and Gia H. Ngo and Nancy F. Chen",
  title =        "Hierarchical Character Embeddings: Learning
                 Phonological and Semantic Representations in Languages
                 of Logographic Origin Using Recursive Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "461--473",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Logographs (Chinese characters) have recursive
                 structures (i.e. hierarchies of sub-units in
                 logographs) that contain phonological and semantic
                 information, as developmental psychology literature
                 suggests that native speakers leverage on the
                 structures to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dani Cherkassky and Sharon Gannot",
  title =        "Successive Relative Transfer Function Identification
                 Using Blind Oblique Projection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "474--486",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Distortionless speech extraction in a reverberant
                 environment can be achieved by applying a beamforming
                 algorithm, provided that the relative transfer
                 functions (RTFs) of the sources and the covariance
                 matrix of the noise are known. In this paper, the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ivo Trowitzsch and Christopher Schymura and Dorothea
                 Kolossa and Klaus Obermayer",
  title =        "Joining Sound Event Detection and Localization Through
                 Spatial Segregation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "487--502",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Identification and localization of sounds are both
                 integral parts of computational auditory scene
                 analysis. Although each can be solved separately, the
                 goal of forming coherent auditory objects and achieving
                 a comprehensive spatial scene understanding \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shinichi Mogami and Norihiro Takamune and Daichi
                 Kitamura and Hiroshi Saruwatari and Yu Takahashi and
                 Kazunobu Kondo and Nobutaka Ono",
  title =        "Independent Low-Rank Matrix Analysis Based on
                 Time-Variant Sub-{Gaussian} Source Model for Determined
                 Blind Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "503--518",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Independent low-rank matrix analysis (ILRMA) is a fast
                 and stable method of blind audio source separation.
                 Conventional ILRMAs assume time-variant
                 (super-)Gaussian source models, which can only
                 represent signals that follow a super-Gaussian
                 distribution. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hamzeh Ghasemzadeh and Meisam K. Arjmandi",
  title =        "Toward Optimum Quantification of Pathology-Induced
                 Noises: an Investigation of Information Missed by Human
                 Auditory System",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "519--528",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Clinical diagnosis of voice disorder and evaluation of
                 therapy outcome heavily rely on accurate quantification
                 of voice quality, which is closely tied to the
                 physiology and function of the laryngeal mechanism.
                 Considering the evaluation methodology of the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Fei Ma and Wen Zhang and Thushara Dheemantha
                 Abhayapala",
  title =        "Active Control of Outgoing Broadband Noise Fields in
                 Rooms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "529--539",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Active noise control system has been actively
                 researched over the past half century, and implemented
                 to reduce noises in ducts, headsets, and inside several
                 automobile models. However, active control of noise
                 fields, and specifically broadband noise \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jing-Xuan Zhang and Zhen-Hua Ling and Li-Rong Dai",
  title =        "Non-Parallel Sequence-to-Sequence Voice Conversion
                 With Disentangled Linguistic and Speaker
                 Representations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "540--552",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "This article presents a method of sequence-to-sequence
                 (seq2seq) voice conversion using non-parallel training
                 data. In this method, disentangled linguistic and
                 speaker representations are extracted from acoustic
                 features, and voice conversion is achieved \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tao Dai and Li Zhu and Yaxiong Wang and Kathleen M.
                 Carley",
  title =        "Attentive Stacked Denoising Autoencoder With {Bi-LSTM}
                 for Personalized Context-Aware Citation
                 Recommendation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "553--568",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "The rapid growth of scientific publications brings the
                 problem of finding appropriate citations for authors.
                 Context-aware citation recommendation is an essential
                 technology to overcome this obstacle when given a
                 fragment of manuscript. In this article, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuta Nishimura and Katsuhito Sudoh and Graham Neubig
                 and Satoshi Nakamura",
  title =        "Multi-Source Neural Machine Translation With Missing
                 Data",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "569--580",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Machine translation is rife with ambiguities in word
                 ordering and word choice, and even with the advent of
                 machine-learning methods that learn to resolve this
                 ambiguity based on statistics from large corpora,
                 mistakes are frequent. Multi-source \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jin Wang and Liang-Chih Yu and K. Robert Lai and
                 Xuejie Zhang",
  title =        "Tree-Structured Regional {CNN-LSTM} Model for
                 Dimensional Sentiment Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "581--591",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Dimensional sentiment analysis aims to recognize
                 continuous numerical values in multiple dimensions such
                 as the valence-arousal (VA) space. Compared to the
                 categorical approach that focuses on sentiment
                 classification such as binary classification (i.e.,
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Abul Azad and Lamine Mili",
  title =        "Robust Speech Filter and Voice Encoder Parameter
                 Estimation Using the Phase--Phase Correlator",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "592--604",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In recent years, linear prediction voice encoders have
                 become very efficient in terms of computing execution
                 time and channel bandwidth usage while providing, in
                 the absence of impulsive noise, natural sounding
                 synthetic speech signals. This good \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Abdullah Fahim and Prasanga N. Samarasinghe and
                 Thushara D. Abhayapala",
  title =        "Multi-Source {DOA} Estimation Through Pattern
                 Recognition of the Modal Coherence of a Reverberant
                 Soundfield",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "605--618",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "We propose a novel multi-source direction of arrival
                 (DOA) estimation technique using a convolutional neural
                 network algorithm which learns the modal coherence
                 patterns of an incident soundfield through measured
                 spherical harmonic coefficients. We train \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yaron Laufer and Bracha Laufer-Goldshtein and Sharon
                 Gannot",
  title =        "{ML} Estimation and {CRBs} for Reverberation, Speech,
                 and Noise {PSDs} in Rank-Deficient Noise Field",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "619--634",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech communication systems are prone to performance
                 degradation in reverberant and noisy acoustic
                 environments. Dereverberation and noise reduction
                 algorithms typically require several model parameters,
                 e.g.~the speech, reverberation and noise
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhongqing Wang and Qingying Sun and Shoushan Li and
                 Qiaoming Zhu and Guodong Zhou",
  title =        "Neural Stance Detection With Hierarchical Linguistic
                 Representations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "635--645",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Stance detection aims to assign a stance label (i.e.,
                 favor or against) to a post towards a specific target.
                 Recently, there is a growing interest in adopting
                 neural models to detect stance of a document. However,
                 most of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ruizhi Li and Xiaofei Wang and Sri Harish Mallidi and
                 Shinji Watanabe and Takaaki Hori and Hynek Hermansky",
  title =        "Multi-Stream End-to-End Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "646--655",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Attention-based methods and Connectionist Temporal
                 Classification (CTC) network have been promising
                 research directions for end-to-end (E2E) Automatic
                 Speech Recognition (ASR). The joint CTC/Attention model
                 has achieved great success by utilizing both \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yu Maeno and Yuki Mitsufuji and Prasanga N.
                 Samarasinghe and Naoki Murata and Thushara D.
                 Abhayapala",
  title =        "Spherical-Harmonic-Domain Feedforward Active Noise
                 Control Using Sparse Decomposition of Reference Signals
                 from Distributed Sensor Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "656--670",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Active acoustic noise attenuation over a sizable space
                 is a challenging problem in signal processing. The
                 noise attenuation performance of feedforward active
                 noise control (ANC) relies on the preciseness of a
                 reference signal of a primary noise field. To
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qingyu Zhou and Nan Yang and Furu Wei and Shaohan
                 Huang and Ming Zhou and Tiejun Zhao",
  title =        "A Joint Sentence Scoring and Selection Framework for
                 Neural Extractive Document Summarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "671--681",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Extractive document summarization methods aim to
                 extract important sentences to form a summary. Previous
                 works perform this task by first scoring all sentences
                 in the document then selecting most informative ones;
                 while we propose to jointly learn the two \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ivan Kukanov and Trung Ngo Trong and Ville
                 Hautam{\"a}ki and Sabato Marco Siniscalchi and Valerio
                 Mario Salerno and Kong Aik Lee",
  title =        "Maximal Figure-of-Merit Framework to Detect
                 Multi-Label Phonetic Features for Spoken Language
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "682--695",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Bottleneck features (BNFs) generated with a deep
                 neural network (DNN) have proven to boost spoken
                 language recognition accuracy over basic spectral
                 features significantly. However, BNFs are commonly
                 extracted using language-dependent tied-context phone
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shoichi Koyama and Gilles Chardon and Laurent Daudet",
  title =        "Optimizing Source and Sensor Placement for Sound Field
                 Control: an Overview",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "696--714",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In order to control an acoustic field inside a target
                 region, it is important to choose suitable positions of
                 secondary sources (loudspeakers) and sensors (control
                 points/microphones). This article provides an overview
                 of state-of-the-art source and \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Atsushi Ando and Ryo Masumura and Hosana Kamiyama and
                 Satoshi Kobashikawa and Yushi Aono and Tomoki Toda",
  title =        "Customer Satisfaction Estimation in Contact Center
                 Calls Based on a Hierarchical Multi-Task Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "715--728",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "This article presents a novel customer
                 satisfaction~(CS) estimation method that
                 outputs both turn-level and call-level estimations
                 simultaneously. Our key idea is to directly apply
                 turn-level estimation results to call-level estimation
                 and optimize \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Thomas Dietzen and Simon Doclo and Marc Moonen and
                 Toon van Waterschoot",
  title =        "Integrated Sidelobe Cancellation and Linear Prediction
                 {Kalman} Filter for Joint Multi-Microphone Speech
                 Dereverberation, Interfering Speech Cancellation, and
                 Noise Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "740--754",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In multi-microphone speech enhancement, reverberation
                 as well as additive noise and/or interfering speech are
                 commonly suppressed by deconvolution and spatial
                 filtering, e.g., using multi-channel linear prediction
                 (MCLP) on the one hand and beamforming, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Thomas Dietzen and Simon Doclo and Marc Moonen and
                 Toon van Waterschoot",
  title =        "Square Root-Based Multi-Source Early {PSD} Estimation
                 and Recursive {RETF} Update in Reverberant Environments
                 by Means of the Orthogonal {Procrustes} Problem",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "755--769",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Multi-channel short-time Fourier transform (STFT)
                 domain-based processing of reverberant microphone
                 signals commonly relies on power-spectral-density (PSD)
                 estimates of early source images, where early refers to
                 reflections contained within the same STFT \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Liwen Zhang and Ziqiang Shi and Jiqing Han",
  title =        "Pyramidal Temporal Pooling With Discriminative Mapping
                 for Audio Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "770--784",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Audio signals are temporally-structured data, and
                 learning their discriminative representations
                 containing temporal information is crucial for the
                 audio classification. In this article, we propose an
                 audio representation learning method with a \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mengfan Zhang and Zhongshu Ge and Tiejun Liu and
                 Xihong Wu and Tianshu Qu",
  title =        "Modeling of Individual {HRTFs} Based on Spatial
                 Principal Component Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "785--797",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Head-related transfer function (HRTF) plays an
                 important role in the construction of 3D auditory
                 display. This article presents an individual HRTF
                 modeling method using deep neural networks based on
                 spatial principal component analysis. The HRTFs are
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bijue Jia and Jiancheng Lv and Xi Peng and Yao Chen
                 and Shenglan Yang",
  title =        "Hierarchical Regulated Iterative Network for Joint
                 Task of Music Detection and Music Relative Loudness
                 Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1--13",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "One practical requirement of the music copyright
                 management is the estimation of music relative
                 loudness, which is mostly ignored in existing music
                 detection works. To solve this problem, we study the
                 joint task of music detection and music relative
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Nauman Dawalatabad and Srikanth Madikeri and C.
                 Chandra Sekhar and Hema A. Murthy",
  title =        "Novel Architectures for Unsupervised Information
                 Bottleneck Based Speaker Diarization of Meetings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "14--27",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Speaker diarization is an important problem that is
                 topical, and is especially useful as a preprocessor for
                 conversational speech related applications. The
                 objective of this article is two-fold: (i) segment
                 initialization by uniformly distributing speaker
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Midia Yousefi and John H. L. Hansen",
  title =        "Block-Based High Performance {CNN} Architectures for
                 Frame-Level Overlapping Speech Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "28--40",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech technology systems such as Automatic Speech
                 Recognition (ASR), speaker diarization, speaker
                 recognition, and speech synthesis have advanced
                 significantly by the emergence of deep learning
                 techniques. However, none of these voice-enabled
                 systems \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiaming Cheng and Ruiyu Liang and Zhenlin Liang and Li
                 Zhao and Chengwei Huang and Bj{\"o}rn Schuller",
  title =        "A Deep Adaptation Network for Speech Enhancement:
                 Combining a Relativistic Discriminator With
                 Multi-Kernel Maximum Mean Discrepancy",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "41--53",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In deep-learning-based speech enhancement (SE)
                 systems, trained models are often used to handle unseen
                 noise types and language environments in real-life
                 scenarios. However, since production environments
                 differ from training conditions, mismatch problems
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Franz Anders and Mario Hlawitschka and Mirco Fuchs",
  title =        "Comparison of Artificial Neural Network Types for
                 Infant Vocalization Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "54--67",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In this study we compared various neural network types
                 for the task of automatic infant vocalization
                 classification, i.e convolutional, recurrent and
                 fully-connected networks as well as combinations of
                 thereof. The goal was to first determine the optimal
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tomohiko Nakamura and Hirokazu Kameoka",
  title =        "Harmonic-Temporal Factor Decomposition for
                 Unsupervised Monaural Separation of Harmonic Sounds",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "68--82",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "We address the problem of separating a monaural
                 mixture of harmonic sounds into the audio signals of
                 individual semitones in an unsupervised manner.
                 Unsupervised monaural audio source separation has thus
                 far been mainly addressed by two approaches: one
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jens Ahrens and Stefan Bilbao",
  title =        "Computation of Spherical Harmonic Representations of
                 Source Directivity Based on the Finite-Distance
                 Signature",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "83--92",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "The measurement of directivity for sound sources that
                 are not electroacoustic transducers is fundamentally
                 limited because the source cannot be driven with
                 arbitrary signals. A consequence is that directivity
                 can only be measured at a sparse set of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shun-Po Chuang and Alexander H. Liu and Tzu-Wei Sung
                 and Hung-yi Lee",
  title =        "Improving Automatic Speech Recognition and Speech
                 Translation via Word Embedding Prediction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "93--105",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In this article, we target speech translation (ST). We
                 propose lightweight approaches that generally improve
                 either ASR or end-to-end ST models. We leverage
                 continuous representations of words, known as word
                 embeddings, to improve ASR in cascaded systems
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Li Chai and Jun Du and Qing-Feng Liu and Chin-Hui
                 Lee",
  title =        "A Cross-Entropy-Guided Measure {(CEGM)} for Assessing
                 Speech Recognition Performance and Optimizing
                 {DNN}-Based Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "106--117",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "A new cross-entropy-guided measure (CEGM) is proposed
                 to indirectly assess accuracies of automatic speech
                 recognition (ASR) of degraded speech with a speech
                 enhancement front-end and without directly performing
                 ASR experiments. The proposed CEGM is \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "De Hu and Zhe Chen and Fuliang Yin",
  title =        "Passive Geometry Calibration for Microphone Arrays
                 Based on Distributed Damped {Newton} Optimization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "118--131",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Geometry calibration is an inherent challenge in
                 distributed acoustic sensor networks. To mitigate this
                 problem, a passive geometry calibration approach based
                 on distributed damped Newton optimization is proposed.
                 Specifically, a geometric cost function \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Berrak Sisman and Junichi Yamagishi and Simon King and
                 Haizhou Li",
  title =        "An Overview of Voice Conversion and Its Challenges:
                 From Statistical Modeling to Deep Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "132--157",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Speaker identity is one of the important
                 characteristics of human speech. In voice conversion,
                 we change the speaker identity from one to another,
                 while keeping the linguistic content unchanged. Voice
                 conversion involves multiple speech processing
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jilu Jin and Gongping Huang and Xuehan Wang and
                 Jingdong Chen and Jacob Benesty and Israel Cohen",
  title =        "Steering Study of Linear Differential Microphone
                 Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "158--170",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Differential microphone arrays (DMAs) can achieve high
                 directivity and frequency-invariant spatial response
                 with small apertures; they also have a great potential
                 to be used in a wide spectrum of applications for
                 high-fidelity sound acquisition. Although \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ching-Hua Lee and Bhaskar D. Rao and Harinath
                 Garudadri",
  title =        "Proportionate Adaptive Filtering Algorithms Derived
                 Using an Iterative Reweighting Framework",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "171--186",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, based on sparsity-promoting
                 regularization techniques from the sparse signal
                 recovery (SSR) area, least mean square (LMS)-type
                 sparse adaptive filtering algorithms are derived. The
                 approach mimics the iterative reweighted \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shakeel Ahmed and Muhammad Tufail and Muhammad Rehan
                 and Tanveer Abbas and Amna Majid",
  title =        "A Novel Approach for Improved Noise Reduction
                 Performance in Feed-Forward Active Noise Control
                 Systems With (Loudspeaker) Saturation Non-Linearity in
                 the Secondary Path",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "187--197",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In active noise control systems, the performance of
                 the most celebrated filtered-x-least mean square
                 (FxLMS) adaptive algorithm is degraded in the presence
                 of non-linearity in the secondary path. In this
                 article, we propose a novel approach to improve the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Cunhang Fan and Jiangyan Yi and Jianhua Tao and
                 Zhengkun Tian and Bin Liu and Zhengqi Wen",
  title =        "Gated Recurrent Fusion With Joint Training Framework
                 for Robust End-to-End Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "198--209",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "The joint training framework for speech enhancement
                 and recognition methods have obtained quite good
                 performances for robust end-to-end automatic speech
                 recognition (ASR). However, these methods only utilize
                 the enhanced feature as the input of the speech
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Amin Edraki and Wai-Yip Chan and Jesper Jensen and
                 Daniel Fogerty",
  title =        "Speech Intelligibility Prediction Using
                 Spectro-Temporal Modulation Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "210--225",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Spectro-temporal modulations are believed to mediate
                 the analysis of speech sounds in the human primary
                 auditory cortex. Inspired by humans'
                 robustness in comprehending speech in challenging
                 acoustic environments, we propose an intrusive speech
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Phan Le Son",
  title =        "On the Design of Sparse Arrays With
                 Frequency-Invariant Beam Pattern",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "226--238",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Beamformer performs spatial filtering to preserve the
                 desired signal while suppressing interfering signals
                 and noise arriving from directions other than the
                 direction of interest. However, the beam pattern of the
                 conventional beamformer is dependent on \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dylan Menzies and Philip Coleman and Filippo Maria
                 Fazi",
  title =        "A Room Compensation Method by Modification of
                 Reverberant Audio Objects",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "239--252",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Conventional channel-based room equalisation can
                 reduce overall colouration caused by the room response,
                 however it cannot separately correct the colouration
                 caused by the late and early parts of the response, or
                 consider the reverberance in the source \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yonggang Hu and Thushara D. Abhayapala and Prasanga N.
                 Samarasinghe",
  title =        "Multiple Source Direction of Arrival Estimations Using
                 Relative Sound Pressure Based {MUSIC}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "253--264",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Subspace approach of MUSIC (multiple signal
                 classification) has become one of the most popular
                 multi-source direction of arrival (DOA) estimations due
                 to its easy implementation in practice. However, its
                 localization accuracy is vulnerable to noise. This
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Alan Kan and Qinglin Meng",
  title =        "The Temporal Limits Encoder as a Sound Coding Strategy
                 for Bilateral Cochlear Implants",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "265--273",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "The difference in binaural benefit between bilateral
                 cochlear implant (CI) users and normal hearing (NH)
                 listeners has typically been attributed to CI sound
                 coding strategies not encoding the acoustic fine
                 structure (FS) interaural time differences (ITD).
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rui Liu and Berrak Sisman and Feilong Bao and Jichen
                 Yang and Guanglai Gao and Haizhou Li",
  title =        "Exploiting Morphological and Phonological Features to
                 Improve Prosodic Phrasing for {Mongolian} Speech
                 Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "274--285",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Prosodic phrasing is an important factor that affects
                 naturalness and intelligibility in text-to-speech
                 synthesis. Studies show that deep learning techniques
                 improve prosodic phrasing when large text and speech
                 corpus are available. However, for low-. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Fei Ma and Thushara D. Abhayapala and Wen Zhang",
  title =        "Multiple Circular Arrays of Vector Sensors for
                 Real-Time Sound Field Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "286--299",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "This article proposes multiple circular arrays of
                 vector sensors for analyzing the three dimensional
                 sound field. By exploiting the fact that a finite
                 number of spatial basis functions can represent the
                 sound field within a region, the designed arrays
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "David Diaz-Guerra and Antonio Miguel and Jose R.
                 Beltran",
  title =        "Robust Sound Source Tracking Using {SRP-PHAT} and
                 {$3$D} Convolutional Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "300--311",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In this article, we present a new single sound source
                 DOA estimation and tracking system based on the
                 well-known SRP-PHAT algorithm and a three-dimensional
                 Convolutional Neural Network. It uses SRP-PHAT power
                 maps as input features of a fully \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Viet Anh Trinh and Michael Mandel",
  title =        "Directly Comparing the Listening Strategies of Humans
                 and Machines",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "312--323",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatic speech recognition (ASR) has reached human
                 performance on many clean speech corpora, but it
                 remains worse than human listeners in noisy
                 environments. This paper investigates whether this
                 difference in performance might be due to a difference
                 in \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Leda Sari and Mark Hasegawa-Johnson and Samuel
                 Thomas",
  title =        "Auxiliary Networks for Joint Speaker Adaptation and
                 Speaker Change Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "324--333",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Speaker adaptation and speaker change detection have
                 both been studied extensively to improve automatic
                 speech recognition (ASR). In many cases, these two
                 problems are investigated separately: speaker change
                 detection is implemented first to obtain single-.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Jielong Yang and Xionghu Zhong and Weiguang Chen and
                 Wenwu Wang",
  title =        "Multiple Acoustic Source Localization in Microphone
                 Array Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "334--347",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "The problem of multiple acoustic source localization
                 using observations from a microphone array network is
                 investigated in this article. Multiple source signals
                 are assumed to be window-disjoint-orthogonal (WDO) on
                 the time-frequency (TF) domain and time \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Bin Wu and Sakriani Sakti and Jinsong Zhang and
                 Satoshi Nakamura",
  title =        "Tackling Perception Bias in Unsupervised Phoneme
                 Discovery Using {DPGMM-RNN} Hybrid Model and Functional
                 Load",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "348--362",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "The human perception of phonemes is biased against
                 speech sounds. The lack of correspondence between
                 perceptual phonemes and acoustic signals forms a big
                 challenge in designing unsupervised algorithms to
                 distinguish phonemes from sound. We propose the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Taewoong Lee and Liming Shi and Jesper Kj{\ae}r
                 Nielsen and Mads Gr{\ae}sb{\o}ll Christensen",
  title =        "Fast Generation of Sound Zones Using Variable Span
                 Trade-Off Filters in the {DFT}-Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "363--378",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "The creation of sound zones with frequency-domain
                 variable span trade-off filters (VAST) is investigated
                 herein. Both narrowband and broadband discrete Fourier
                 transform (DFT)-domain VAST approaches are proposed,
                 and we discuss their relationship to the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Maoshen Jia and Yuxuan Wu and Changchun Bao and
                 Christian Ritz",
  title =        "Multi-Source {DOA} Estimation in Reverberant
                 Environments by Jointing Detection and Modeling of
                 Time-Frequency Points",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "379--392",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In this article, the direction of arrival (DOA)
                 estimation of multiple speech sources in reverberant
                 environments is investigated based on the recording of
                 a soundfield microphone. First, the recordings are
                 analyzed in the time-frequency (T-F) domain to
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Wei Xue and Alastair H. Moore and Mike Brookes and
                 Patrick A. Naylor",
  title =        "Speech Enhancement Based on Modulation-Domain
                 Parametric Multichannel {Kalman} Filtering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "393--405",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Recently we presented a modulation-domain multichannel
                 Kalman filtering (MKF) algorithm for speech
                 enhancement, which jointly exploits the inter-frame
                 modulation-domain temporal evolution of speech and the
                 inter-channel spatial correlation to estimate the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Wei Song and Jingjin Guo and Ruiji Fu and Ting Liu and
                 Lizhen Liu",
  title =        "A Knowledge Graph Embedding Approach for Metaphor
                 Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "406--420",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Metaphor is a figure of speech that describes one
                 thing (a target) by mentioning another thing (a source)
                 in a way that is not literally true. Metaphor
                 understanding is an interesting but challenging problem
                 in natural language processing. This paper \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Longbiao Cheng and Xingwei Sun and Dingding Yao and
                 Junfeng Li and Yonghong Yan",
  title =        "Estimation Reliability Function Assisted Sound Source
                 Localization With Enhanced Steering Vector Phase
                 Difference",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "421--435",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "The performance of the traditional
                 direction-of-arrival (DOA) estimation algorithms
                 greatly degrades in noisy and reverberant environments.
                 Recently, deep learning has been applied to sound
                 source localization and provided the substantial
                 improvement in \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Wangyang Yu and W. Bastiaan Kleijn",
  title =        "Room Acoustical Parameter Estimation From Room Impulse
                 Responses Using Deep Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "436--447",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "We describe a new method to estimate the geometry of a
                 room and reflection coefficients given room impulse
                 responses. The method utilizes convolutional neural
                 networks to estimate the room geometry and multilayer
                 perceptrons to estimate the reflection \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Miguel Ferrer and Maria de Diego and Gema Pi{\~n}ero
                 and Alberto Gonzalez",
  title =        "Affine Projection Algorithm Over Acoustic Sensor
                 Networks for Active Noise Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "448--461",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Acoustic sensor networks (ASNs) are an effective
                 solution to implement active noise control (ANC)
                 systems by using distributed adaptive algorithms. On
                 one hand, ASNs provide scalable systems where the
                 signal processing load is distributed among the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Nico G{\"o}{\ss}ling and Daniel Marquardt and Simon
                 Doclo",
  title =        "Performance Analysis of the Extended Binaural {MVDR}
                 Beamformer With Partial Noise Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "462--476",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Besides reducing undesired noise sources and limiting
                 speech distortion, another important objective of a
                 binaural noise reduction algorithm is the preservation
                 of the binaural cues of all sound sources in the
                 acoustic scene. In this paper, we consider \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "G{\'a}bor Gosztolya and R{\'o}bert Busa-Fekete",
  title =        "Ensemble Bag-of-Audio-Words Representation Improves
                 Paralinguistic Classification Accuracy",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "477--488",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "A recently introduced, effective feature extraction
                 technique for computational paralinguistics is that of
                 Bag-of-Audio-Words (BoAW), where we cluster the
                 frame-level training vectors, and represent each speech
                 utterance based on the cluster of its \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Alfred Mertins and Marco Maass and Fabrice Katzberg",
  title =        "Room Impulse Response Reshaping and Crosstalk
                 Cancellation Using Convex Optimization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "489--502",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In this article, a new convex formulation for the
                 acoustic channel-equalization problem is proposed and
                 efficient ways for solving it are presented. Both the
                 alternating direction method of multipliers and a
                 proximal algorithm are studied for \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Xuefeng Bai and Pengbo Liu and Yue Zhang",
  title =        "Investigating Typed Syntactic Dependencies for
                 Targeted Sentiment Classification Using Graph Attention
                 Neural Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "503--514",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Targeted sentiment classification predicts the
                 sentiment polarity on given target mentions in input
                 texts. Dominant methods employ neural networks for
                 encoding the input sentence and extracting relations
                 between target mentions and their contexts. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Bengt J. Borgstr{\"o}m and Michael S. Brandstein",
  title =        "{Speech Enhancement via Attention Masking Network
                 (SEAMNET)}: an End-to-End System for Joint Suppression
                 of Noise and Reverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "515--526",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper proposes the Speech Enhancement via
                 Attention Masking Network (SEAMNET), a neural
                 network-based end-to-end single-channel speech
                 enhancement system designed for joint suppression of
                 noise and reverberation. It formalizes an end-to-end
                 network \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Juan M. Miramont and Marcelo A. Colominas and
                 Gast{\'o}n Schlotthauer",
  title =        "Voice Jitter Estimation Using High-Order
                 Synchrosqueezing Operators",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "527--536",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Voice jitter is defined as a random perturbation of
                 the glottal cycle duration which can be useful for
                 voice parametrization and that usually depends on
                 finding fiducial points in this signal. In this paper,
                 a novel application of the Fourier-based high-.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Peidong Wang and Zhuo Chen and DeLiang Wang and Jinyu
                 Li and Yifan Gong",
  title =        "Speaker Separation Using Speaker Inventories and
                 Estimated Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "537--546",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "We propose speaker separation using speaker
                 inventories and estimated speech (SSUSIES), a framework
                 leveraging speaker profiles and estimated speech for
                 speaker separation. SSUSIES contains two methods,
                 speaker separation using speaker inventories (SSUSI)
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Sandro Cumani",
  title =        "On the Distribution of Speaker Verification Scores:
                 Generative Models for Unsupervised Calibration",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "547--562",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Speaker verification systems whose outputs can be
                 interpreted as log-likelihood ratios (LLR) allow for
                 cost-effective decisions by comparing the system
                 outputs to application-defined thresholds depending
                 only on prior information. Classifiers often \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Yu-Ren Chien and J{\'o}n Gu{\eth}nason",
  title =        "Acoustic Measure of Vocal Strain Based on Glottal
                 Airflow Periodicity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "563--574",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "In the clinical practice of dysphonia, the effects of
                 treatment are traditionally monitored by a sequence of
                 auditory-perceptual assessments aimed at measuring
                 vocal quality for the patient. Alternatively, acoustic
                 measurement of vocal quality promises to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Xingfa Shen and Xingkun Shao and Quanbo Ge and Lili
                 Liu",
  title =        "{RARS}: Recognition of Audio Recording Source Based on
                 Residual Neural Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "575--584",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "With the popularity of mobile devices and the
                 emergence of various audio-editing tools, it becomes
                 easier to produce and forge audio files. Many criminals
                 will forge false audio information as evidence.
                 Therefore, audio forensics technology becomes
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Gang Chen and Yang Liu and Huanbo Luan and Meng Zhang
                 and Qun Liu and Maosong Sun",
  title =        "Learning to Generate Explainable Plots for Neural
                 Story Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "585--593",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Story generation is an important natural language
                 processing task that aims to generate coherent stories
                 automatically. While the use of neural networks has
                 proven effective in improving story generation, how to
                 learn to generate an explainable high-level \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Wenxing Yang and Jacob Benesty and Gongping Huang and
                 Jingdong Chen",
  title =        "A New Class of Differential Beamformers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "594--606",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Differential microphone arrays (DMAs) have been used
                 in a wide range of applications for high-fidelity
                 acoustic signal acquisition and enhancement. In the
                 design of differential beamformers, three of the widely
                 used measures are the directivity factor (DF).
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Yuki Mitsufuji and Norihiro Takamune and Shoichi
                 Koyama and Hiroshi Saruwatari",
  title =        "Multichannel Blind Source Separation Based on
                 Evanescent-Region-Aware Non-Negative Tensor
                 Factorization in Spherical Harmonic Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "607--617",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "There is growing interest in new audio formats in the
                 context of virtual reality (VR), and higher-order
                 ambisonics (HOA) is preferred for VR systems to
                 transmit recorded scenes owing to its transmission
                 efficiency and its flexibility to work with \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "D{\"o}rte Fischer and Simon Doclo",
  title =        "Robust Constrained {MFMVDR} Filters for Single-Channel
                 Speech Enhancement Based on Spherical Uncertainty Set",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "618--631",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Aiming at exploiting speech correlation across
                 consecutive time-frames in the short-time Fourier
                 transform domain, the multi-frame minimum variance
                 distortionless response (MFMVDR) filter for
                 single-channel speech enhancement has been proposed.
                 The MFMVDR \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Xudong Zhao and Jacob Benesty and Jingdong Chen and
                 Gongping Huang",
  title =        "Differential Beamforming From the Beampattern
                 Factorization Perspective",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "632--643",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "Differential beamformers have demonstrated a great
                 potential in forming frequency-invariant beampatterns
                 and achieving high directivity factors. Most
                 conventional approaches design differential beamformers
                 in such a way that their beampatterns resemble a
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Yuki Kawara and Chenhui Chu and Yuki Arase",
  title =        "Preordering Encoding on Transformer for Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "644--655",
  month =        jan,
  year =         "2021",
  DOI =          "",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "",
  URL =          "",
  abstract =     "The difference in word orders between source and
                 target languages is a serious hurdle for machine
                 translation. Preordering methods, which reorder the
                 words in a source sentence before translation to obtain
                 a similar word ordering with a target language,
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "c1--ix",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "c2--c2",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "x--xx",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Yuki Kawara and Chenhui Chu and Yuki Arase",
  title =        "Preordering Encoding on Transformer for Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "644--655",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Hirokazu Kameoka and Wen-Chin Huang and Kou Tanaka and
                 Takuhiro Kaneko and Nobukatsu Hojo and Tomoki Toda",
  title =        "Many-to-Many Voice Transformer Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "656--670",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jie Zhang and Huawei Chen and Li-Rong Dai and Richard
                 Christian Hendriks",
  title =        "A Study on Reference Microphone Selection for
                 Multi-Microphone Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "671--683",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Archontis Politis and Annamaria Mesaros and Sharath
                 Adavanne and Toni Heittola and Tuomas Virtanen",
  title =        "Overview and Evaluation of Sound Event Localization
                 and Detection in {DCASE 2019}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "684--698",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Markus Niermann and Peter Vary",
  title =        "Listening Enhancement in Noisy Environments: Solutions
                 in Time and Frequency Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "699--709",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hyeonseung Lee and Woo Hyun Kang and Sung Jun Cheon
                 and Hyeongju Kim and Nam Soo Kim",
  title =        "Gated Recurrent Context: Softmax-Free Attention for
                 Online Encoder-Decoder Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "710--719",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Elizabeth Vargas and James R. Hopgood and Keith Brown
                 and Kartic Subr",
  title =        "On Improved Training of {CNN} for Acoustic Source
                 Localisation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "720--732",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yunqi Cai and Lantian Li and Andrew Abel and Xiaoyan
                 Zhu and Dong Wang",
  title =        "Deep Normalization for Speaker Vectors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "733--744",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wen-Chin Huang and Tomoki Hayashi and Yi-Chiao Wu and
                 Hirokazu Kameoka and Tomoki Toda",
  title =        "Pretraining Techniques for Sequence-to-Sequence Voice
                 Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "745--755",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Arindam Jati and Amrutha Nadarajan and Raghuveer Peri
                 and Karel Mundnich and Tiantian Feng and Benjamin
                 Girault and Shrikanth Narayanan",
  title =        "Temporal Dynamics of Workplace Acoustic Scenes:
                 Egocentric Analysis and Prediction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "756--769",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chaoqun Duan and Kehai Chen and Rui Wang and Masao
                 Utiyama and Eiichiro Sumita and Conghui Zhu and Tiejun
                 Zhao",
  title =        "Modeling Future Cost for Neural Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "770--781",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kashif Munir and Hai Zhao and Zuchao Li",
  title =        "Adaptive Convolution for Semantic Role Labeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "782--791",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi-Chiao Wu and Tomoki Hayashi and Takuma Okamoto and
                 Hisashi Kawai and Tomoki Toda",
  title =        "Quasi-Periodic Parallel {WaveGAN}: a
                 Non-Autoregressive Raw Waveform Generative Model With
                 Pitch-Dependent Dilated Convolution Neural Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "792--806",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Weitao Yuan and Bofei Dong and Shengbei Wang and
                 Masashi Unoki and Wenwu Wang",
  title =        "Evolving Multi-Resolution Pooling {CNN} for Monaural
                 Singing Voice Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "807--822",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Liming Shi and Taewoong Lee and Lijun Zhang and Jesper
                 Kj{\ae}r Nielsen and Mads Gr{\ae}sb{\o}ll Christensen",
  title =        "Generation of Personal Sound Zones With Physical
                 Meaningful Constraints and Conjugate Gradient Method",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "823--837",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xi Chen and Jacob Benesty and Gongping Huang and
                 Jingdong Chen",
  title =        "On the Robustness of the Superdirective Beamformer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "838--849",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xinsheng Wang and Tingting Qiao and Jihua Zhu and Alan
                 Hanjalic and Odette Scharenborg",
  title =        "Generating Images From Spoken Descriptions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "850--865",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Vevake Balaraman and Bernardo Magnini",
  title =        "Domain-Aware Dialogue State Tracker for Multi-Domain
                 Dialogue Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "866--873",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xixin Wu and Yuewen Cao and Hui Lu and Songxiang Liu
                 and Shiyin Kang and Zhiyong Wu and Xunying Liu and
                 Helen Meng",
  title =        "Exemplar-Based Emotive Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "874--886",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Heinrich Dinkel and Mengyue Wu and Kai Yu",
  title =        "Towards Duration Robust Weakly Supervised Sound Event
                 Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "887--900",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zamir Ben-Hur and David Lou Alon and Ravish Mehra and
                 Boaz Rafaely",
  title =        "Binaural Reproduction Based on Bilateral Ambisonics
                 and Ear-Aligned {HRTFs}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "901--913",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Philipp Aichinger and Franz Pernkopf",
  title =        "Synthesis and Analysis-By-Synthesis of Modulated
                 Diplophonic Glottal Area Waveforms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "914--926",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Finnian Kelly and John H. L. Hansen",
  title =        "Analysis and Calibration of {Lombard} Effect and
                 Whisper for Speaker Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "927--942",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Matthias M{\"u}ller and Thilo Schulz and Tatiana
                 Ermakova and Philipp P. Caffier",
  title =        "Lyric or Dramatic --- Vibrato Analysis for Voice Type
                 Classification in Professional Opera Singers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "943--955",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dem{\'o}stenes Z. Rodr{\'\i}guez and Dick Carrillo and
                 Miguel A. Ram{\'\i}rez and Pedro H. J. Nardelli and
                 Sebastian M{\"o}ller",
  title =        "Incorporating Wireless Communication Parameters Into
                 the E-Model Algorithm",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "956--968",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tianrui Zong and Yong Xiang and Iynkaran Natgunanathan
                 and Longxiang Gao and Guang Hua and Wanlei Zhou",
  title =        "Non-Linear-Echo Based Anti-Collusion Mechanism for
                 Audio Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "969--984",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zheng Lian and Bin Liu and Jianhua Tao",
  title =        "{CTNet}: Conversational Transformer Network for
                 Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "985--1000",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiacheng Zhang and Huanbo Luan and Maosong Sun and
                 Feifei Zhai and Jingfang Xu and Yang Liu",
  title =        "Neural Machine Translation With Explicit Phrase
                 Alignment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1001--1010",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Maria Vukovic and Melissa Stolar and Margaret Lech",
  title =        "Cognitive Load Estimation From Speech Commands to
                 Simulated Aircraft",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1011--1022",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "De Hu and Zhe Chen and Fuliang Yin",
  title =        "Geometry Calibration for Acoustic Transceiver Networks
                 Based on Network {Newton} Distributed Optimization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1023--1032",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuki Saito and Shinnosuke Takamichi and Hiroshi
                 Saruwatari",
  title =        "Perceptual-Similarity-Aware Deep Speaker
                 Representation Learning for Multi-Speaker Generative
                 Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1033--1048",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tadashi Sakata and Naomitsu Ikeda and Yuichi Ueda and
                 Akira Watanabe",
  title =        "Vocal Tract Length Estimation Using Accumulated Means
                 of Formants and Its Effects on Speaker-Normalization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1049--1064",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jichen Yang and Hongji Wang and Rohan Kumar Das and
                 Yanmin Qian",
  title =        "Modified Magnitude-Phase Spectrum Information for
                 Spoofing Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1065--1078",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yanmin Qian and Zhengyang Chen and Shuai Wang",
  title =        "Audio-Visual Deep Neural Network for Robust Person
                 Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1079--1092",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Peiqin Lin and Meng Yang and Jianhuang Lai",
  title =        "Deep Selective Memory Network With Selective Attention
                 and Inter-Aspect Modeling for Aspect Level Sentiment
                 Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1093--1106",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Herman Kamper and Yevgen Matusevych and Sharon
                 Goldwater",
  title =        "Improved Acoustic Word Embeddings for Zero-Resource
                 Languages Using Multilingual Transfer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1107--1118",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Weiqing Wang and Jin Pan and Hua Yi and Zhanmei Song
                 and Ming Li",
  title =        "Audio-Based Piano Performance Evaluation for Beginners
                 With Convolutional Neural Network and Attention
                 Mechanism",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1119--1133",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi-Chiao Wu and Tomoki Hayashi and Patrick Lumban
                 Tobing and Kazuhiro Kobayashi and Tomoki Toda",
  title =        "Quasi-Periodic {WaveNet}: an Autoregressive Raw
                 Waveform Generative Model With Pitch-Dependent Dilated
                 Convolution Neural Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1134--1148",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Vesa V{\"a}lim{\"a}ki and Karolina Prawda",
  title =        "Late-Reverberation Synthesis Using Interleaved
                 Velvet-Noise Sequences",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1149--1160",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhuosheng Zhang and Junlong Li and Hai Zhao",
  title =        "Multi-Turn Dialogue Reading Comprehension With Pivot
                 Turns and Knowledge",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1161--1173",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Cl{\'e}ment Gaultier and Sr{\dj}an Kiti{\'c} and
                 R{\'e}mi Gribonval and Nancy Bertin",
  title =        "Sparsity-Based Audio Declipping Methods: Selected
                 Overview, New Algorithms, and Large-Scale Evaluation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1174--1187",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lachlan Birnie and Thushara Abhayapala and Vladimir
                 Tourbabin and Prasanga Samarasinghe",
  title =        "Mixed Source Sound Field Translation for Virtual
                 Binaural Application With Perceptual Validation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1188--1203",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Monisankha Pal and Manoj Kumar and Raghuveer Peri and
                 Tae Jin Park and So Hyun Kim and Catherine Lord and
                 Somer Bishop and Shrikanth Narayanan",
  title =        "Meta-Learning With Latent Space Clustering in
                 Generative Adversarial Network for Speaker
                 Diarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1204--1219",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jie Zhang and Jun Du and Li-Rong Dai",
  title =        "Sensor Selection for Relative Acoustic Transfer
                 Function Steered Linearly-Constrained Beamformers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1220--1232",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Huang Xie and Tuomas Virtanen",
  title =        "Zero-Shot Audio Classification Via Semantic
                 Embeddings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1233--1242",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xianhong Chen and Changchun Bao",
  title =        "Phoneme-Unit-Specific Time-Delay Neural Network for
                 Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1243--1255",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dongyuan Shi and Woon-Seng Gan and Bhan Lam and Shulin
                 Wen and Xiaoyi Shen",
  title =        "Optimal Output-Constrained Active Noise Control Based
                 on Inverse Adaptive Modeling Leak Factor Estimate",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1256--1269",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ashutosh Pandey and DeLiang Wang",
  title =        "Dense {CNN} With Self-Attention for Time-Domain Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1270--1279",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Libo Qin and Wanxiang Che and Minheng Ni and Yangming
                 Li and Ting Liu",
  title =        "Knowing Where to Leverage: Context-Aware Graph
                 Convolutional Network With an Adaptive Fusion Layer for
                 Contextual Spoken Language Understanding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1280--1289",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mingyang Zhang and Yi Zhou and Li Zhao and Haizhou
                 Li",
  title =        "Transfer Learning From Speech Synthesis to Voice
                 Conversion With Non-Parallel Training Data",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1290--1302",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Weipeng He and Petr Motlicek and Jean-Marc Odobez",
  title =        "Neural Network Adaptation and Data Augmentation for
                 Multi-Speaker Direction-of-Arrival Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1303--1317",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yile Wang and Leyang Cui and Yue Zhang",
  title =        "Improving Skip-Gram Embeddings Using {BERT}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1318--1328",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Linzhi Wu and Meishan Zhang",
  title =        "Deep Graph-Based Character-Level {Chinese} Dependency
                 Parsing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1329--1339",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ye Bai and Jiangyan Yi and Jianhua Tao and Zhengqi Wen
                 and Zhengkun Tian and Shuai Zhang",
  title =        "Integrating Knowledge Into End-to-End Speech
                 Recognition From External Text-Only Data",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1340--1351",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Byung Joon Cho and Hyung-Min Park",
  title =        "Convolutional Maximum-Likelihood Distortionless
                 Response Beamforming With Steering Vector Estimation
                 for Robust Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1352--1367",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Daniel Michelsanti and Zheng-Hua Tan and Shi-Xiong
                 Zhang and Yong Xu and Meng Yu and Dong Yu and Jesper
                 Jensen",
  title =        "An Overview of Deep-Learning-Based Audio-Visual Speech
                 Enhancement and Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1368--1396",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Gal Itzhak and Jacob Benesty and Israel Cohen",
  title =        "On the Design of Differential {Kronecker} Product
                 Beamformers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1397--1410",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhongshu Ge and Liang Li and Tianshu Qu",
  title =        "Partially Matching Projection Decoding Method
                 Evaluation Under Different Playback Conditions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1411--1423",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sijie Mai and Songlong Xing and Haifeng Hu",
  title =        "Analyzing Multimodal Sentiment Via Acoustic- and
                 Visual-{LSTM} With Channel-Aware Temporal Convolution
                 Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1424--1437",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tao Qian and Meishan Zhang and Yinxia Lou and Daiwen
                 Hua",
  title =        "A Joint Model for Named Entity Recognition With
                 Sentence-Level Entity Type Attentions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1438--1448",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ryotaro Sato and Kenta Niwa and Kazunori Kobayashi",
  title =        "Ambisonic Signal Processing {DNNs} Guaranteeing
                 Rotation, Scale and Time Translation Equivariance",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1449--1462",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sooyeon Park and Jung-Woo Choi",
  title =        "Iterative Echo Labeling Algorithm With Convex Hull
                 Expansion for Room Geometry Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1463--1478",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Aidan O. T. Hogg and Christine Evers and Alastair H.
                 Moore and Patrick A. Naylor",
  title =        "Overlapping Speaker Segmentation Using Multiple
                 Hypothesis Tracking of Fundamental Frequency",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1479--1490",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rajib Sharma and Israel Cohen and Baruch Berdugo",
  title =        "Controlling Elevation and Azimuth Beamwidths With
                 Concentric Circular Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1491--1502",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Run-Ze Wang and Zhen-Hua Ling and Jing-Bo Zhou and Yu
                 Hu",
  title =        "A Multiple-Integration Encoder for Multi-Turn
                 Text-to-{SQL} Semantic Parsing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1503--1513",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shoukang Hu and Xurong Xie and Shansong Liu and
                 Jianwei Yu and Zi Ye and Mengzhe Geng and Xunying Liu
                 and Helen Meng",
  title =        "{Bayesian} Learning of {LF-MMI} Trained Time Delay
                 Neural Networks for Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1514--1529",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Matteo Torcoli and Thorsten Kastner and J{\"u}rgen
                 Herre",
  title =        "Objective Measures of Perceptual Audio Quality
                 Reviewed: an Evaluation of Their Application Domain
                 Dependence",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1530--1541",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Heinrich Dinkel and Shuai Wang and Xuenan Xu and
                 Mengyue Wu and Kai Yu",
  title =        "Voice Activity Detection in the Wild: a Data-Driven
                 Approach Using Teacher-Student Training",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1542--1555",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Songbin Li and Jingang Wang and Peng Liu and Miao Wei
                 and Qiandong Yan",
  title =        "Detection of Multiple Steganography Methods in
                 Compressed Speech Based on Code Element Embedding,
                 {Bi-LSTM} and {CNN} With Attention Mechanisms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1556--1569",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qianli Ma and Jiangyue Yan and Zhenxi Lin and Liuhong
                 Yu and Zipeng Chen",
  title =        "Deformable Self-Attention for Text Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1570--1581",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ya-Jie Zhang and Zhen-Hua Ling",
  title =        "Extracting and Predicting Word-Level Style Variations
                 for Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1582--1593",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Alexander Bohlender and Ann Spriet and Wouter Tirry
                 and Nilesh Madhu",
  title =        "Exploiting Temporal Context in {CNN} Based Multisource
                 {DOA} Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1594--1608",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kohei Yatabe and Daichi Kitamura",
  title =        "Determined {BSS} Based on Time-Frequency Masking and
                 Its Application to Harmonic Vector Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1609--1625",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ji Won Yoon and Hyeonseung Lee and Hyung Yong Kim and
                 Won Ik Cho and Nam Soo Kim",
  title =        "{TutorNet}: Towards Flexible Knowledge Distillation
                 for End-to-End Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1626--1638",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Prachi Singh and Sriram Ganapathy",
  title =        "Self-Supervised Representation Learning With Path
                 Integral Clustering for Speaker Diarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1639--1649",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Penghui Wei and Jiahao Zhao and Wenji Mao",
  title =        "A Graph-to-Sequence Learning Framework for Summarizing
                 Opinionated Texts",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1650--1660",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dovid Y. Levin and Shmulik Markovich-Golan and Sharon
                 Gannot",
  title =        "Near-Field Superdirectivity: an Analytical
                 Perspective",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1661--1674",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jia-Hao Hsu and Ming-Hsiang Su and Chung-Hsien Wu and
                 Yi-Hsuan Chen",
  title =        "Speech Emotion Recognition Considering Nonverbal
                 Vocalization in Affective Conversations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1675--1686",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tomohiko Nakamura and Shihori Kozuka and Hiroshi
                 Saruwatari",
  title =        "Time-Domain Audio Source Separation With Neural
                 Networks Based on Multiresolution Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1687--1701",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yun Zhang and Yongguo Liu and Jiajing Zhu and Xindong
                 Wu",
  title =        "{FSPRM}: a Feature Subsequence Based Probability
                 Representation Model for {Chinese} Word Embedding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1702--1716",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Songxiang Liu and Yuewen Cao and Disong Wang and Xixin
                 Wu and Xunying Liu and Helen Meng",
  title =        "Any-to-Many Voice Conversion With Location-Relative
                 Sequence-to-Sequence Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1717--1728",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rafael A. Chiea and M{\'a}rcio H. Costa and J{\'u}lio
                 A. Cordioli",
  title =        "An Optimal Envelope-Based Noise Reduction Method for
                 Cochlear Implants: an Upper Bound Performance
                 Investigation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1729--1739",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Junliang Guo and Zhirui Zhang and Linli Xu and Boxing
                 Chen and Enhong Chen",
  title =        "Adaptive Adapters: an Efficient Way to Incorporate
                 {BERT} Into Neural Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1740--1751",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi Luo and Cong Han and Nima Mesgarani",
  title =        "Group Communication With Context Codec for Lightweight
                 Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1752--1761",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhiwen Xie and Runjie Zhu and Jin Liu and Guangyou
                 Zhou and Jimmy Xiangji Huang",
  title =        "Hierarchical Neighbor Propagation With Bidirectional
                 Graph Attention Network for Relation Prediction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1762--1773",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xuehan Wang and Jacob Benesty and Jingdong Chen and
                 Gongping Huang and Israel Cohen",
  title =        "Beamforming with Cube Microphone Arrays Via
                 {Kronecker} Product Decompositions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1774--1784",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ke Tan and DeLiang Wang",
  title =        "Towards Model Compression for Deep Learning Based
                 Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1785--1794",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kristina Tesch and Timo Gerkmann",
  title =        "Nonlinear Spatial Filtering in Multichannel Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1795--1805",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rui Liu and Berrak Sisman and Guanglai Gao and Haizhou
                 Li",
  title =        "Expressive {TTS} Training With Frame and Style
                 Reconstruction Loss",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1806--1818",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jipeng Qiang and Xinyu Lu and Yun Li and Yunhao Yuan
                 and Xindong Wu",
  title =        "{Chinese} Lexical Simplification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1819--1828",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Andong Li and Wenzhe Liu and Chengshi Zheng and
                 Cunhang Fan and Xiaodong Li",
  title =        "Two Heads are Better Than One: a Two-Stage Complex
                 Spectral Mapping Approach for Monaural Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1829--1843",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Eric C. Hamdan and Filippo Maria Fazi",
  title =        "Weighted Orthogonal Vector Rejection Method for
                 Loudspeaker-Based Binaural Audio Reproduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1844--1852",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ke Tan and Xueliang Zhang and DeLiang Wang",
  title =        "Deep Learning Based Real-Time Speech Enhancement for
                 Dual-Microphone Mobile Phones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1853--1863",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kunkun SongGong and Huawei Chen and Wenwu Wang",
  title =        "Indoor Multi-Speaker Localization Based on {Bayesian}
                 Nonparametrics in the Circular Harmonic Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1864--1880",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Aleksej Chinaev and Philipp Th{\"u}ne and Gerald
                 Enzner",
  title =        "Double-Cross-Correlation Processing for Blind
                 Sampling-Rate and Time-Offset Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1881--1896",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ye Bai and Jiangyan Yi and Jianhua Tao and Zhengkun
                 Tian and Zhengqi Wen and Shuai Zhang",
  title =        "Fast End-to-End Speech Recognition Via
                 Non-Autoregressive Models and Cross-Modal Knowledge
                 Transferring From {BERT}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1897--1911",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "{\"O}yk{\"u} Deniz K{\"o}se and Murat Sara{\c{c}}lar",
  title =        "Multimodal Representations for Synchronized Speech and
                 Real-Time {MRI} Video Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1912--1924",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "N. P. Narendra and Bj{\"o}rn Schuller and Paavo Alku",
  title =        "The Detection of {Parkinson}'s Disease From Speech
                 Using Voice Source Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1925--1936",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Robert Rehr and Timo Gerkmann",
  title =        "{SNR-Based} Features and Diverse Training Data for
                 Robust {DNN-Based} Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1937--1949",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Nobutaka Ito and Rintaro Ikeshita and Hiroshi Sawada
                 and Tomohiro Nakatani",
  title =        "A Joint Diagonalization Based Efficient Approach to
                 Underdetermined Blind Audio Source Separation Using the
                 Multichannel {Wiener} Filter",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1950--1965",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hao Fei and Shengqiong Wu and Yafeng Ren and Donghong
                 Ji",
  title =        "Second-Order Semantic Role Labeling With Global
                 Structural Refinement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1966--1976",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Humberto M. Torres and Mercedes G{\"u}emes and Jorge
                 A. Gurlekian and Diego A. Evin",
  title =        "{F0} Perturbation Due to Articulatory Movements:
                 Filtering, Characterization and Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1977--1986",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Khaled Koutini and Hamid Eghbal-zadeh and Gerhard
                 Widmer",
  title =        "Receptive Field Regularization Techniques for Audio
                 Classification and Tagging With Deep Convolutional
                 Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1987--2000",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhong-Qiu Wang and Peidong Wang and DeLiang Wang",
  title =        "Multi-microphone Complex Spectral Mapping for
                 Utterance-wise and Continuous Speech Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2001--2014",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mengjia Zhou and Donghong Ji and Fei Li",
  title =        "Relation Extraction in Dialogues: a Deep Learning
                 Model Based on the Generality and Specialty of Dialogue
                 Text",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2015--2026",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Minh Nguyen and Gia H. Ngo and Nancy F. Chen",
  title =        "Domain-Shift Conditioning Using Adaptable Filtering
                 Via Hierarchical Embeddings for Robust {Chinese} Spell
                 Check",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2027--2036",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lior Madmoni and Shir Tibor and Israel Nelken and Boaz
                 Rafaely",
  title =        "The Effect of Partial Time-Frequency Masking of the
                 Direct Sound on the Perception of Reverberant Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2037--2047",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Haibin Chen and Qianli Ma and Liuhong Yu and Zhenxi
                 Lin and Jiangyue Yan",
  title =        "Corpus-Aware Graph Aggregation Network for Sequence
                 Labeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2048--2057",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Heming Wang and DeLiang Wang",
  title =        "Towards Robust Speech Super-Resolution",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2058--2066",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jianwei Yu and Shi-Xiong Zhang and Bo Wu and Shansong
                 Liu and Shoukang Hu and Mengzhe Geng and Xunying Liu
                 and Helen Meng and Dong Yu",
  title =        "Audio-Visual Multi-Channel Integration and Recognition
                 of Overlapped Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2067--2082",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Olga Slizovskaia and Gloria Haro and Emilia
                 G{\'o}mez",
  title =        "Conditioned Source Separation for Musical Instrument
                 Performances",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2083--2095",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xurong Xie and Xunying Liu and Tan Lee and Lan Wang",
  title =        "{Bayesian} Learning for Deep Neural Network
                 Adaptation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2096--2110",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sankha Subhra Bhattacharjee and Nithin V. George",
  title =        "Nearest {Kronecker} Product Decomposition Based
                 Linear-in-The-Parameters Nonlinear Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2111--2122",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Canguang Li and Guohua Wang and Jin Cao and Yi Cai",
  title =        "A Multi-Agent Communication Based Model for Nested
                 Named Entity Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2123--2136",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jonah Ong and Ba Tuong Vo and Sven Nordholm",
  title =        "Blind Separation for Multiple Moving Sources With
                 Labeled Random Finite Sets",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2137--2151",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yixuan Su and Yan Wang and Deng Cai and Simon Baker
                 and Anna Korhonen and Nigel Collier",
  title =        "{PROTOTYPE-TO-STYLE}: Dialogue Generation With
                 Style-Aware Editing on Retrieval Memory",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2152--2161",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Alberto Bernardini and Enrico Bozzo and Federico
                 Fontana and Augusto Sarti",
  title =        "A Wave Digital {Newton--Raphson} Method for Virtual
                 Analog Modeling of Audio Circuits with Multiple
                 One-Port Nonlinearities",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2162--2173",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Gang Guo and Yi Yu and Rodrigo C. de Lamare and
                 Zongsheng Zheng and Lu Lu and Qiangming Cai",
  title =        "Proximal Normalized Subband Adaptive Filtering for
                 Acoustic Echo Cancellation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2174--2188",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Juho Liski and Aki M{\"a}kivirta and Vesa
                 V{\"a}lim{\"a}ki",
  title =        "Audibility of Group-Delay Equalization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2189--2201",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Farjana Sultana Mim and Naoya Inoue and Paul Reisert
                 and Hiroki Ouchi and Kentaro Inui",
  title =        "Corruption Is Not All Bad: Incorporating Discourse
                 Structure Into Pre-Training via Corruption for Essay
                 Scoring",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2202--2215",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dror Kipnis and Roee Diamant",
  title =        "Graph-Based Clustering of Dolphin Whistles",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2216--2227",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuanyuan Liu and Nelly Penttil{\"a} and Tiina
                 Ihalainen and Juulia Lintula and Rachel Convey and Okko
                 R{\"a}s{\"a}nen",
  title =        "Language-Independent Approach for Automatic
                 Computation of Vowel Articulation Features in
                 Dysarthric Speech Assessment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2228--2243",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "C. Medina and R. Coelho and L. Z{\~a}o",
  title =        "Impulsive Noise Detection for Speech Enhancement in
                 {HHT} Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2244--2253",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Iv{\'a}n L{\'o}pez-Espejo and Zheng-Hua Tan and Jesper
                 Jensen",
  title =        "A Novel Loss Function and Training Strategy for
                 Noise-Robust Keyword Spotting",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2254--2266",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shansong Liu and Mengzhe Geng and Shoukang Hu and
                 Xurong Xie and Mingyu Cui and Jianwei Yu and Xunying
                 Liu and Helen Meng",
  title =        "Recent Progress in the {CUHK} Dysarthric Speech
                 Recognition System",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2267--2281",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Juan Zhao and Tianrui Zong and Yong Xiang and
                 Longxiang Gao and Wanlei Zhou and Gleb Beliakov",
  title =        "Desynchronization Attacks Resilient Watermarking
                 Method Based on Frequency Singular Value Coefficient
                 Modification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2282--2295",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mert Burkay {\c{C}}{\"o}teli and H{\"u}seyin
                 Hac{\i}habibo{\u{g}}lu",
  title =        "Sparse Representations With {Legendre} Kernels for
                 {DOA} Estimation and Acoustic Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2296--2309",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Nicolas Furnon and Romain Serizel and Slim Essid and
                 Irina Illina",
  title =        "{DNN}-Based Mask Estimation for Distributed Speech
                 Enhancement in Spatially Unconstrained Microphone
                 Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2310--2323",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Or Haim Anidjar and Itshak Lapidot and Chen Hajaj and
                 Amit Dvir and Issachar Gilad",
  title =        "Hybrid Speech and Text Analysis Methods for Speaker
                 Change Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2324--2338",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chuang Fan and Chaofa Yuan and Lin Gui and Yue Zhang
                 and Ruifeng Xu",
  title =        "Multi-Task Sequence Tagging for Emotion-Cause Pair
                 Extraction Via Tag Distribution Refinement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2339--2350",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Andy T. Liu and Shang-Wen Li and Hung-yi Lee",
  title =        "{TERA}: Self-Supervised Learning of Transformer
                 Encoder Representation for Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2351--2366",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guanlong Zhao and Shaojin Ding and Ricardo
                 Gutierrez-Osuna",
  title =        "Converting Foreign Accent Speech Without a Reference",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2367--2381",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kilian Schulze-Forster and Clement S. J. Doire and
                 Ga{\"e}l Richard and Roland Badeau",
  title =        "Phoneme Level Lyrics Alignment and Text-Informed
                 Singing Voice Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2382--2395",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shengqiong Wu and Hao Fei and Yafeng Ren and Bobo Li
                 and Fei Li and Donghong Ji",
  title =        "High-Order Pair-Wise Aspect and Opinion Terms
                 Extraction With Edge-Enhanced Syntactic Graph
                 Convolution",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2396--2406",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jingyi Wu and Lin Shang and Xiaoying Gao",
  title =        "Sentiment Time Series Calibration for Event
                 Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2407--2420",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kashif Munir and Hai Zhao and Zuchao Li",
  title =        "Learning Context-Aware Convolutional Filters for
                 Implicit Discourse Relation Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2421--2433",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Seokhwan Kim and Hannes Schulz and Chulaka Gunasekara
                 and Chiori Hori and Abhinav Rastogi and Luis Fernando
                 D. Haro",
  title =        "Editorial: Special Issue on the Eighth Dialog System
                 Technology Challenge",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2434--2436",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Byoungjae Kim and Jungyun Seo and Myoung-Wan Koo",
  title =        "Randomly Wired Network Based on {RoBERTa} and Dialog
                 History Attention for Response Selection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2437--2442",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jia-Chen Gu and Tianda Li and Zhen-Hua Ling and Quan
                 Liu and Zhiming Su and Yu-Ping Ruan and Xiaodan Zhu",
  title =        "Deep Contextualized Utterance Representations for
                 Response Selection and Dialogue Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2443--2455",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yun-Wei Chu and Kuan-Yen Lin and Chao-Chun Hsu and
                 Lun-Wei Ku",
  title =        "End-to-End Recurrent Cross-Modality Attention for
                 Video Dialogue",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2456--2464",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kun Xu and Han Wu and Linfeng Song and Haisong Zhang
                 and Linqi Song and Dong Yu",
  title =        "Conversational Semantic Role Labeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2465--2475",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zekang Li and Zongjia Li and Jinchao Zhang and Yang
                 Feng and Jie Zhou",
  title =        "Bridging Text and Video: a Universal Multimodal
                 Transformer for Audio-Visual Scene-Aware Dialog",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2476--2483",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Igor Shalyminov and Alessandro Sordoni and Adam
                 Atkinson and Hannes Schulz",
  title =        "{GRTr}: Generative-Retrieval Transformers for
                 Data-Efficient Dialogue Domain Adaptation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2484--2492",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiali Zeng and Yongjing Yin and Yang Liu and Yubin Ge
                 and Jinsong Su",
  title =        "Domain Adaptive Meta-Learning for Dialogue State
                 Tracking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2493--2501",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chen Zhang and Grandee Lee and Luis Fernando D. Haro
                 and Haizhou Li",
  title =        "{D-Score}: Holistic Dialogue Evaluation Without
                 Reference",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2502--2516",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shrikant Malviya and Rohit Mishra and Santosh Kumar
                 Barnwal and Uma Shanker Tiwary",
  title =        "{HDRS}: {Hindi} Dialogue Restaurant Search Corpus for
                 Dialogue State Tracking in Task-Oriented Environment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2517--2528",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Seokhwan Kim and Michel Galley and Chulaka Gunasekara
                 and Sungjin Lee and Adam Atkinson and Baolin Peng and
                 Hannes Schulz and Jianfeng Gao and Jinchao Li and
                 Mahmoud Adada and Minlie Huang and Luis Lastras and
                 Jonathan K. Kummerfeld and Walter S. Lasecki and Chiori
                 Hori and Anoop Cherian and Tim K. Marks and Abhinav
                 Rastogi and Xiaoxue Zang and Srinivas Sunkara and
                 Raghav Gupta",
  title =        "Overview of the {Eighth Dialog System Technology
                 Challenge: DSTC8}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2529--2540",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Myeongho Jeong and Seungtaek Choi and Jinyoung Yeo and
                 Seung-won Hwang",
  title =        "Label and Context Augmentation for Response Selection
                 at {DSTC8}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2541--2550",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qing Liu and Lei Chen and Yuan Yuan and Huarui Wu",
  title =        "History Reuse and Bag-of-Words Loss for Long Summary
                 Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2551--2560",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lu Zhang and Mingjiang Wang and Qiquan Zhang and
                 Xinsheng Wang and Ming Liu",
  title =        "{PhaseDCN}: a Phase-Enhanced Dual-Path Dilated
                 Convolutional Network for Single-Channel Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2561--2574",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kazi Nazmul Haque and Rajib Rana and Jiajun Liu and
                 John H. L. Hansen and Nicholas Cummins and Carlos Busso
                 and Bj{\"o}rn W. Schuller",
  title =        "Guided Generative Adversarial Neural Network for
                 Representation Learning and Audio Generation Using
                 Fewer Labelled Audio Data",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2575--2590",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Toru Nakashika and Kohei Yatabe",
  title =        "Gamma {Boltzmann} Machine for Audio Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2591--2605",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xintong Li and Lemao Liu and Zhaopeng Tu and Guanlin
                 Li and Shuming Shi and Max Q.-H. Meng",
  title =        "Attending From Foresight: a Novel Attention Mechanism
                 for Neural Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2606--2616",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hengshun Zhou and Jun Du and Yuanyuan Zhang and Qing
                 Wang and Qing-Feng Liu and Chin-Hui Lee",
  title =        "Information Fusion in Attention Networks Using
                 Adaptive and Multi-Level Factorized Bilinear Pooling
                 for Audio-Visual Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2617--2629",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuling Li and Kui Yu and Yuhong Zhang",
  title =        "Learning Cross-Lingual Mappings in Imperfectly
                 Isomorphic Embedding Spaces",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2630--2642",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiao Zhou and Zhen-Hua Ling and Li-Rong Dai",
  title =        "{UnitNet}: a Sequence-to-Sequence Acoustic Model for
                 Concatenative Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2643--2655",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zihan Pan and Malu Zhang and Jibin Wu and Jiadong Wang
                 and Haizhou Li",
  title =        "Multi-Tone Phase Coding of Interaural Time Difference
                 for Sound Source Localization With Spiking Neural
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2656--2670",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ken {O'Hanlon} and Mark B. Sandler",
  title =        "{FifthNet}: Structured Compact Neural Networks for
                 Automatic Chord Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2671--2682",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Simone Spagnol and Riccardo Miccini and Marius George
                 Onofrei and Runar Unnthorsson and Stefania Serafin",
  title =        "Estimation of Spectral Notches From Pinna Meshes:
                 Insights From a Simple Computational Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2683--2695",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chenglin Xu and Wei Rao and Jibin Wu and Haizhou Li",
  title =        "Target Speaker Verification With Selective Auditory
                 Attention for Single and Multi-Talker Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2696--2709",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Adel Zahedi and Michael Syskind Pedersen and Jan
                 {\O}stergaard and Thomas Ulrich Christiansen and Lars
                 Bramsl{\o}w and Jesper Jensen",
  title =        "Minimum Processing Beamforming",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2710--2724",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xianghui Wang and Jie Chen and Xiaoyi Chen and Jing
                 Guo and Qian Xiang",
  title =        "Multichannel Iterative Noise Reduction Filters in the
                 Short-Time-Fourier-Transform Domain Based on
                 {Kronecker} Product Decomposition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2725--2740",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kai-Li Yin and Yi-Fei Pu and Lu Lu",
  title =        "Robust {Q}-Gradient Subband Adaptive Filter for
                 Nonlinear Active Noise Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2741--2752",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jaeuk Byun and Jong Won Shin",
  title =        "Monaural Speech Separation Using Speaker Embedding
                 From Preliminary Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2753--2763",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xudong Zhao and Gongping Huang and Jingdong Chen and
                 Jacob Benesty",
  title =        "On the Design of {3D} Steerable Beamformers With
                 Uniform Concentric Circular Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2764--2778",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zifeng Cheng and Zhiwei Jiang and Yafeng Yin and Na Li
                 and Qing Gu",
  title =        "A Unified Target-Oriented Sequence-to-Sequence Model
                 for Emotion-Cause Pair Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2779--2791",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hamid Azadi and Mohammad-R. Akbarzadeh-T and Hamid-R.
                 Kobravi and Ali Shoeibi",
  title =        "Robust Voice Feature Selection Using Interval Type-2
                 Fuzzy {AHP} for Automated Diagnosis of {Parkinson}'s
                 Disease",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2792--2802",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yukiya Hono and Kei Hashimoto and Keiichiro Oura and
                 Yoshihiko Nankaku and Keiichi Tokuda",
  title =        "Sinsy: a Deep Neural Network-Based Singing Voice
                 Synthesis System",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2803--2815",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jian Tang and Jie Zhang and Yan Song and Ian
                 McLoughlin and Li-Rong Dai",
  title =        "Multi-Granularity Sequence Alignment Mapping for
                 Encoder-Decoder Based End-to-End {ASR}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2816--2828",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chongman Leong and Xuebo Liu and Derek F. Wong and
                 Lidia S. Chao",
  title =        "Exploiting Translation Model for Parallel Corpus
                 Mining",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2829--2839",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Neil Zeghidour and David Grangier",
  title =        "{Wavesplit}: End-to-End Speech Separation by Speaker
                 Clustering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2840--2849",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dino Oglic and Zoran Cvetkovic and Peter Sollich",
  title =        "Learning Waveform-Based Acoustic Models Using Deep
                 Variational Convolutional Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2850--2863",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Alexandru Nelus and Rainer Martin",
  title =        "Privacy-Preserving Audio Classification Using
                 Variational Information Feature Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2864--2877",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hao Li and DeLiang Wang and Xueliang Zhang and
                 Guanglai Gao",
  title =        "Recurrent Neural Networks and Acoustic Features for
                 Frame-Level Signal-to-Noise Ratio Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2878--2887",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi Zhou and Xiaoqing Zheng and Xuanjing Huang",
  title =        "Generating Responses With a Given Syntactic Pattern in
                 {Chinese} Dialogues",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2888--2898",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Viktor Gunnarsson and Mikael Sternad",
  title =        "Binaural Auralization of Microphone Array Room Impulse
                 Responses Using Causal {Wiener} Filtering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2899--2914",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zuolong Chen and Huawei Chen and Quansheng Tu",
  title =        "Sensor Imperfection Tolerance Analysis of Robust
                 Linear Differential Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2915--2929",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yusheng Su and Xu Han and Yankai Lin and Zhengyan
                 Zhang and Zhiyuan Liu and Peng Li and Jie Zhou and
                 Maosong Sun",
  title =        "{CSS-LM}: a Contrastive Framework for Semi-Supervised
                 Fine-Tuning of Pre-Trained Language Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2930--2941",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tobias Kabzinski and Peter Jax",
  title =        "A Causality-Constrained Frequency-Domain Least-Squares
                 Filter Design Method for Crosstalk Cancellation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2942--2956",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Frank Zalkow and Meinard M{\"u}ller",
  title =        "{CTC-Based} Learning of Chroma Features for Score
                 Audio Music Retrieval",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2957--2971",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Teck Kai Chan and Cheng Siong Chin",
  title =        "Multi-Branch Convolutional Macaron net for Sound Event
                 Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2972--2985",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tedd Kourkounakis and Amirhossein Hajavi and Ali
                 Etemad",
  title =        "{FluentNet}: End-to-End Detection of Stuttered Speech
                 Disfluencies With Deep Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "2986--2999",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Haoyu Li and Junichi Yamagishi",
  title =        "Multi-Metric Optimization Using Generative Adversarial
                 Networks for Near-End Speech Intelligibility
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3000--3011",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zehao Lin and Shaobo Cui and Guodun Li and Xiaoming
                 Kang and Feng Ji and Fenglin Li and Zhongzhou Zhao and
                 Haiqing Chen and Yin Zhang",
  title =        "Predict-Then-Decide: a Predictive Approach for Wait or
                 Answer Task in Dialogue Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3012--3024",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Metin Calis and Steven van de Par and Richard Heusdens
                 and Richard Christian Hendriks",
  title =        "Localization Based on Enhanced Low Frequency
                 Interaural Level Difference",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3025--3039",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Christopher Liberatore",
  title =        "Native-Nonnative Voice Conversion by Residual Warping
                 in a Sparse, Anchor-Based Representation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3040--3051",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shoichi Koyama and Jesper Brunnstr{\"o}m and Hayato
                 Ito and Natsuki Ueno and Hiroshi Saruwatari",
  title =        "Spatial Active Noise Control Based on Kernel
                 Interpolation of Sound Field",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3052--3063",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jipeng Qiang and Yun Li and Yi Zhu and Yunhao Yuan and
                 Yang Shi and Xindong Wu",
  title =        "{LSBert}: Lexical Simplification Based on {BERT}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3064--3076",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ningyu Zhang and Hongbin Ye and Shumin Deng and
                 Chuanqi Tan and Mosha Chen and Songfang Huang and Fei
                 Huang and Huajun Chen",
  title =        "Contrastive Information Extraction With Generative
                 Transformer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3077--3088",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jianyu Wang and Shanzheng Guan and Shupei Liu and
                 Xiao-Lei Zhang",
  title =        "Minimum-Volume Multichannel Nonnegative Matrix
                 Factorization for Blind Audio Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3089--3103",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Alberto Carini and Stefania Cecchi and Alessandro
                 Terenzi and Simone Orcioni",
  title =        "A Room Impulse Response Measurement Method Robust
                 Towards Nonlinearities Based on Orthogonal Periodic
                 Sequences",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3104--3117",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jie Zhang and Changheng Li",
  title =        "Quantization-Aware Binaural {MWF} Based Noise
                 Reduction Incorporating External Wireless Devices",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3118--3131",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Biru Zhu and Xingyao Zhang and Ming Gu and Yangdong
                 Deng",
  title =        "Knowledge Enhanced Fact Checking and Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3132--3143",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mark A. Poletti and Paul D. Teal",
  title =        "A Superfast {Toeplitz} Matrix Inversion Method for
                 Single- and Multi-Channel Inverse Filters and Its
                 Application to Room Equalization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3144--3157",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guanlin Li and Lemao Liu and Conghui Zhu and Rui Wang
                 and Tiejun Zhao and Shuming Shi",
  title =        "Detecting Source Contextual Barriers for Understanding
                 Neural Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3158--3169",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chia-Chih Kuo and Kuan-Yu Chen and Shang-Bao Luo",
  title =        "Audio-Aware Spoken Multiple-Choice Question Answering
                 With Pre-Trained Language Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3170--3179",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rui Liu and Zheng Lin and Weiping Wang",
  title =        "Addressing Extraction and Generation Separately:
                 Keyphrase Prediction With Pre-Trained Language Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3180--3191",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiangnan Li and Hongliang Pan and Zheng Lin and Peng
                 Fu and Weiping Wang",
  title =        "Sarcasm Detection with Commonsense Knowledge",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3192--3201",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Runyan Yang and Gaofeng Cheng and Haoran Miao and Ta
                 Li and Pengyuan Zhang and Yonghong Yan",
  title =        "Keyword Search Using Attention-Based End-to-End {ASR}
                 and Frame-Synchronous Phoneme Alignments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3202--3215",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tareq Alkhaldi and Chenhui Chu and Sadao Kurohashi",
  title =        "Flexibly Focusing on Supporting Facts, Using Bridge
                 Links, and Jointly Training Specialized Modules for
                 Multi-Hop Question Answering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3216--3225",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wenyi Wu and Yegui Xiao and Jianhui Lin and Liying Ma
                 and Khashayar Khorasani",
  title =        "An Efficient Filter Bank Structure for Adaptive Notch
                 Filtering and Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3226--3241",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xinsheng Wang and Justin van der Hout and Jihua Zhu
                 and Mark Hasegawa-Johnson and Odette Scharenborg",
  title =        "Synthesizing Spoken Descriptions of Images",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3242--3254",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Vincent W. Neo and Christine Evers and Patrick A.
                 Naylor",
  title =        "Enhancement of Noisy Reverberant Speech Using
                 Polynomial Matrix Eigenvalue Decomposition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3255--3266",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Riccardo Giampiccolo and Mauro Giuseppe de Bari and
                 Alberto Bernardini and Augusto Sarti",
  title =        "Wave Digital Modeling and Implementation of Nonlinear
                 Audio Circuits With Nullors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3267--3279",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xixin Wu and Yuewen Cao and Hui Lu and Songxiang Liu
                 and Disong Wang and Zhiyong Wu and Xunying Liu and
                 Helen Meng",
  title =        "Speech Emotion Recognition Using Sequential Capsule
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3280--3291",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuan Gong and Yu-An Chung and James Glass",
  title =        "{PSLA}: Improving Audio Tagging With Pretraining,
                 Sampling, Labeling, and Aggregation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3292--3306",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Licheng Zhang and Zhendong Mao and Benfeng Xu and Quan
                 Wang and Yongdong Zhang",
  title =        "Review and Arrange: Curriculum Learning for Natural
                 Language Understanding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3307--3320",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Fei He and Ling He and Jing Zhang and Yuanyuan Li and
                 Xi Xiong",
  title =        "Automatic Detection of Affective Flattening in
                 Schizophrenia: Acoustic Correlates to Sound Waves and
                 Auditory Perception",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3321--3334",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Saoussen Mathlouthi Bouzid and Chiraz Ben Othmane
                 Zribi",
  title =        "Efficient Learning Approach for Pronominal Anaphora
                 and Ellipsis Identification and Resolution in {Arabic}
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3335--3348",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Arda Y{\"u}ksel and Berke U{\u{g}}urlu and Aykut
                 Ko{\c{c}}",
  title =        "Semantic Change Detection With {Gaussian} Word
                 Embeddings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3349--3361",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mei Li and Lu Xiang and Xiaomian Kang and Yang Zhao
                 and Yu Zhou and Chengqing Zong",
  title =        "Medical Term and Status Generation From {Chinese}
                 Clinical Dialogue With Multi-Granularity Transformer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3362--3374",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yongwei Li and Jianhua Tao and Donna Erickson and Bin
                 Liu and Masato Akagi",
  title =        "{$ F_0 $}-Noise-Robust Glottal Source and Vocal Tract
                 Analysis Based on {ARX-LF} Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3375--3383",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xianwen Liao and Yongzhong Huang and Yongzhuang Wei
                 and Chenhao Zhang and Fu Wang and Yong Wang",
  title =        "Efficient Estimate of Sentence's Representation Based
                 on the Difference Semantics Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3384--3399",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kwang Myung Jeon and Geon Woo Lee and Nam Kyun Kim and
                 Hong Kook Kim",
  title =        "{TAU-Net}: Temporal Activation {$U$}-Net Shared With
                 Nonnegative Matrix Factorization for Speech Enhancement
                 in Unseen Noise Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3400--3414",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi-Yang Ding and Hao-Jian Lin and Li-Juan Liu and
                 Zhen-Hua Ling and Yu Hu",
  title =        "Robustness of Speech Spoofing Detectors Against
                 Adversarial Post-Processing of Voice Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3415--3426",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi Zhou and Xiaohai Tian and Haizhou Li",
  title =        "Language Agnostic Speaker Embedding for Cross-Lingual
                 Personalized Speech Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3427--3439",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ju Lin and Adriaan J. de Lind van Wijngaarden and
                 Kuang-Ching Wang and Melissa C. Smith",
  title =        "Speech Enhancement Using Multi-Stage Self-Attentive
                 Temporal Convolutional Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3440--3450",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wei-Ning Hsu and Benjamin Bolte and Yao-Hung Hubert
                 Tsai and Kushal Lakhotia and Ruslan Salakhutdinov and
                 Abdelrahman Mohamed",
  title =        "{HuBERT}: Self-Supervised Speech Representation
                 Learning by Masked Prediction of Hidden Units",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3451--3460",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kouei Yamaoka and Nobutaka Ono and Shoji Makino",
  title =        "Time-Frequency-Bin-Wise Linear Combination of
                 Beamformers for Distortionless Signal Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3461--3475",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhong-Qiu Wang and Gordon Wichern and Jonathan {Le
                 Roux}",
  title =        "Convolutive Prediction for Monaural Speech
                 Dereverberation and Noisy-Reverberant Speaker
                 Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3476--3490",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bing Yang and Hong Liu and Xiaofei Li",
  title =        "Learning Deep Direct-Path Relative Transfer Function
                 for Binaural Sound Source Localization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3491--3503",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yiming Cui and Wanxiang Che and Ting Liu and Bing Qin
                 and Ziqing Yang",
  title =        "Pre-Training With Whole Word Masking for {Chinese}
                 {BERT}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3504--3514",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Leda Sar{\i} and Mark Hasegawa-Johnson and Chang D.
                 Yoo",
  title =        "Counterfactually Fair Automatic Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3515--3525",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhuohuang Zhang and Yong Xu and Meng Yu and Shi-Xiong
                 Zhang and Lianwu Chen and Donald S. Williamson and Dong
                 Yu",
  title =        "Multi-Channel Multi-Frame {ADL-MVDR} for Target Speech
                 Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3526--3540",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Nils L. Westhausen and Rainer Huber and Hannah
                 Baumgartner and Ragini Sinha and Jan Rennies and Bernd
                 T. Meyer",
  title =        "Reduction of Subjective Listening Effort for {TV}
                 Broadcast Signals With Recurrent Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3541--3550",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shota Sasaki and Jun Suzuki and Kentaro Inui",
  title =        "Subword-Based Compact Reconstruction for
                 Open-Vocabulary Neural Word Embeddings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3551--3564",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaodong Cui and Wei Zhang and Abdullah Kayi and
                 Mingrui Liu and Ulrich Finkler and Brian Kingsbury and
                 George Saon and David Kung",
  title =        "Asynchronous Decentralized Distributed Training of
                 Acoustic Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3565--3576",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Junqing Zhang and Wen Zhang and Jihui Aimee Zhang and
                 Thushara Dheemantha Abhayapala and Lijun Zhang",
  title =        "Spatial Active Noise Control in Rooms Using Higher
                 Order Sources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3577--3591",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bingzhi Chen and Qi Cao and Mixiao Hou and Zheng Zhang
                 and Guangming Lu and David Zhang",
  title =        "Multimodal Emotion Recognition With Temporal and
                 Semantic Consistency",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3592--3603",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "S. Supraja and Andy W. H. Khong and S. Tatinati",
  title =        "Regularized Phrase-Based Topic Model for Automatic
                 Question Classification With Domain-Agnostic Class
                 Labels",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3604--3616",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Natsuko Maeda and Filippo Maria Fazi and Falk-Martin
                 Hoffmann",
  title =        "Sound Field Reproduction With a Cylindrical
                 Loudspeaker Array Using First Order Wall Reflections",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3617--3630",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xugang Lu and Peng Shen and Yu Tsao and Hisashi
                 Kawai",
  title =        "Coupling a Generative Model With a Discriminative
                 Learning Framework for Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3631--3641",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hannes Helmholz and David Lou Alon and Sebasti{\`a} V.
                 Amengual Gar{\'\i} and Jens Ahrens",
  title =        "Effects of Additive Noise in Binaural Rendering of
                 Spherical Microphone Array Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3642--3653",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Joanna Hong and Minsu Kim and Se Jin Park and Yong Man
                 Ro",
  title =        "Speech Reconstruction With Reminiscent Sound Via
                 Visual Voice Memory",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3654--3667",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ran Weisman and Tom Shlomo and Vladimir Tourbabin and
                 Paul Calamia and Boaz Rafaely",
  title =        "Robustness of Acoustic Rake Filters in Minimum
                 Variance Beamforming",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3668--3678",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Junhao Xu and Jianwei Yu and Shoukang Hu and Xunying
                 Liu and Helen Meng",
  title =        "Mixed Precision Low-Bit Quantization of Neural Network
                 Language Models for Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3679--3693",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jidong Ge and Yunyun Huang and Xiaoyu Shen and Chuanyi
                 Li and Wei Hu",
  title =        "Learning Fine-Grained Fact-Article Correspondence in
                 Legal Cases",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3694--3706",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qiuqiang Kong and Bochen Li and Xuchen Song and Yuan
                 Wan and Yuxuan Wang",
  title =        "High-Resolution Piano Transcription With Pedals by
                 Regressing Onset and Offset Times",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3707--3717",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{2021 Index \booktitle{IEEE/ACM Transactions on Audio,
                 Speech, and Language Processing Vol. 29}}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "3718--3760",
  year =         "2021",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "C2--C2",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qianying Liu and Wenyu Guan and Sujian Li and Fei
                 Cheng and Daisuke Kawahara and Sadao Kurohashi",
  title =        "{RODA}: Reverse Operation Based Data Augmentation for
                 Solving Math Word Problems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1--11",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kai Zhen and Jongmo Sung and Mi Suk Lee and Seungkwon
                 Beack and Minje Kim",
  title =        "Scalable and Efficient Neural Speech Coding: a Hybrid
                 Design",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "12--25",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sen Yang and Yang Liu and Dawei Feng and Dongsheng
                 Li",
  title =        "Text Generation From Data With Dynamic Planning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "26--34",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Stefan Liebich and Peter Vary",
  title =        "Occlusion Effect Cancellation in Headphones and
                 Hearing Devices---The Sister of Active Noise
                 Cancellation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "35--48",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhuosheng Zhang and Haojie Yu and Hai Zhao and Masao
                 Utiyama",
  title =        "Which Apple Keeps Which Doctor Away? {Colorful} Word
                 Representations With Visual Oracles",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "49--59",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhenyu Wang and John H. L. Hansen",
  title =        "Multi-Source Domain Adaptation for Text-Independent
                 Forensic Speaker Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "60--75",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kengtao Zheng and Nankai Lin and Shengyi Jiang",
  title =        "Unsupervised Character Embedding Correction and
                 Candidate Word Denoising",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "76--86",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bing Ma and Haifeng Sun and Jingyu Wang and Qi Qi and
                 Jianxin Liao",
  title =        "Extractive Dialogue Summarization Without Annotation
                 Based on Distantly Supervised Machine Reading
                 Comprehension in Customer Service",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "87--97",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shengcai Liu and Ning Lu and Cheng Chen and Ke Tang",
  title =        "Efficient Combinatorial Optimization for Word-Level
                 Adversarial Textual Attack",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "98--111",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Alessandro Terenzi and Nicola Ortolani and In{\^e}s
                 Nolasco and Emmanouil Benetos and Stefania Cecchi",
  title =        "Comparison of Feature Extraction Methods for
                 Sound-Based Classification of Honey Bee Activity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "112--122",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shuiyang Mao and P. C. Ching and Tan Lee",
  title =        "Enhancing Segment-Based Speech Emotion Recognition by
                 Iterative Self-Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "123--134",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Abdolreza Sabzi Shahrebabaki and Giampiero Salvi and
                 Torbj{\o}rn Svendsen and Sabato Marco Siniscalchi",
  title =        "Acoustic-to-Articulatory Mapping With Joint
                 Optimization of Deep Speech Enhancement and
                 Articulatory Inversion Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "135--147",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Javier Jorge and Adri{\`a} Gim{\'e}nez and Joan Albert
                 Silvestre-Cerd{\`a} and Jorge Civera and Albert Sanchis
                 and Alfons Juan",
  title =        "Live Streaming Speech Recognition Using Deep
                 Bidirectional {LSTM} Acoustic Models and Interpolated
                 Language Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "148--161",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Muhammed P. V. Shifas and C{\u{a}}t{\u{a}}lin
                 Zoril{\u{a}} and Yannis Stylianou",
  title =        "End-to-End Neural Based Modification of Noisy Speech
                 for Speech-in-Noise Intelligibility Improvement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "162--173",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Joon-Young Yang and Joon-Hyuk Chang",
  title =        "{VACE-WPE}: Virtual Acoustic Channel Expansion Based
                 on Neural Networks for Weighted Prediction Error-Based
                 Speech Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "174--189",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chenpeng Du and Kai Yu",
  title =        "Phone-Level Prosody Modelling With {GMM}-Based {MDN}
                 for Diverse and Controllable Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "190--201",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Haibin Wu and Xu Li and Andy T. Liu and Zhiyong Wu and
                 Helen Meng and Hung-Yi Lee",
  title =        "Improving the Adversarial Robustness for Speaker
                 Verification by Self-Supervised Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "202--217",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mixiao Hou and Zheng Zhang and Qi Cao and David Zhang
                 and Guangming Lu",
  title =        "Multi-View Speech Emotion Recognition Via Collective
                 Relation Construction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "218--229",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Da-rong Liu and Po-chun Hsu and Yi-chen Chen and
                 Sung-feng Huang and Shun-po Chuang and Da-yi Wu and
                 Hung-yi Lee",
  title =        "Learning Phone Recognition From Unpaired Audio and
                 Phone Sequences Based on Generative Adversarial
                 Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "230--243",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuting Zhao and Mamoru Komachi and Tomoyuki Kajiwara
                 and Chenhui Chu",
  title =        "Word-Region Alignment-Guided Multimodal Neural Machine
                 Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "244--259",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhuosheng Zhang and Yiqing Zhang and Hai Zhao",
  title =        "Syntax-Aware Multi-Spans Generation for Reading
                 Comprehension",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "260--268",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Pengfei Zhu and Zhuosheng Zhang and Hai Zhao and
                 Xiaoguang Li",
  title =        "{DUMA}: Reading Comprehension With Transposition
                 Thinking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "269--279",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiayuan Xie and Ningxin Peng and Yi Cai and Tao Wang
                 and Qingbao Huang",
  title =        "Diverse Distractor Generation for Constructing
                 High-Quality Multiple Choice Questions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "280--291",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jie Zhang and Guanghui Zhang",
  title =        "A Parametric Unconstrained Beamformer Based Binaural
                 Noise Reduction for Assistive Hearing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "292--304",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Luca Turchet and Johan Pauwels",
  title =        "Music Emotion Recognition: Intention of
                 Composers-Performers Versus Perception of Musicians,
                 Non-Musicians, and Listening Machines",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "305--316",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wenxin Hou and Han Zhu and Yidong Wang and Jindong
                 Wang and Tao Qin and Renjun Xu and Takahiro Shinozaki",
  title =        "Exploiting Adapters for Cross-Lingual Low-Resource
                 Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "317--329",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kehai Chen and Rui Wang and Masao Utiyama and Eiichiro
                 Sumita",
  title =        "Integrating Prior Translation Knowledge Into Neural
                 Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "330--339",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Keqi Deng and Gaofeng Cheng and Runyan Yang and
                 Yonghong Yan",
  title =        "Alleviating {ASR} Long-Tailed Problem by Decoupling
                 the Learning of Representation and Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "340--354",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zuchao Li and Junru Zhou and Hai Zhao and Kevin
                 Parnow",
  title =        "{HPSG}-Inspired Joint Neural Constituent and
                 Dependency Parsing in {$ O(n^3) $} Time Complexity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "355--366",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xuan Shi and Erica Cooper and Junichi Yamagishi",
  title =        "Use of Speaker Recognition Approaches for Learning and
                 Evaluating Embedding Representations of Musical
                 Instrument Sounds",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "367--377",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zengwei Yao and Wenjie Pei and Fanglin Chen and
                 Guangming Lu and David Zhang",
  title =        "Stepwise-Refining Speech Separation Network via
                 Fine-Grained Encoding in High-Order Latent Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "378--393",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yanmin Qian and Zhikai Zhou",
  title =        "Optimizing Data Usage for Low-Resource Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "394--403",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Narla John Metilda Sagaya Mary and Srinivasan Umesh
                 and Sandesh Varadaraju Katta",
  title =        "{S}-Vectors and {TESA}: Speaker Embeddings and a
                 Speaker Authenticator Based on Transformer Encoder",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "404--413",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bengt J. Borgstr{\"o}m",
  title =        "{Bayesian} Estimation of {PLDA} in the Presence of
                 Noisy Training Labels, With Applications to Speaker
                 Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "414--428",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Menglong Lu and Zhen Huang and Binyang Li and Yunxiang
                 Zhao and Zheng Qin and DongSheng Li",
  title =        "{SIFTER}: a Framework for Robust Rumor Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "429--442",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lantian Li and Dong Wang and Jiawen Kang and Renyu
                 Wang and Jing Wu and Zhendong Gao and Xiao Chen",
  title =        "A Principle Solution for Enroll-Test Mismatch in
                 Speaker Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "443--455",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Feiran Yang",
  title =        "Analysis of Deficient-Length Partitioned-Block
                 Frequency-Domain Adaptive Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "456--467",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hui Jiang and Linfeng Song and Yubin Ge and Fandong
                 Meng and Junfeng Yao and Jinsong Su",
  title =        "An {AST} Structure Enhanced Decoder for Code
                 Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "468--476",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anssi Kanervisto and Ville Hautam{\"a}ki and Tomi
                 Kinnunen and Junichi Yamagishi",
  title =        "Optimizing Tandem Speaker Verification and
                 Anti-Spoofing Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "477--488",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xin Ni and Jia Ren",
  title =        "{FC-U2-Net}: a Novel Deep Neural Network for Singing
                 Voice Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "489--494",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Neil Zeghidour and Alejandro Luebs and Ahmed Omran and
                 Jan Skoglund and Marco Tagliasacchi",
  title =        "{SoundStream}: an End-to-End Neural Audio Codec",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "495--507",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wageesha Manamperi and Thushara D. Abhayapala and
                 Jihui Zhang and Prasanga N. Samarasinghe",
  title =        "Drone Audition: Sound Source Localization Using
                 On-Board Microphones",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "508--519",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qian Li and Hao Peng and Jianxin Li and Jia Wu and
                 Yuanxing Ning and Lihong Wang and Philip S. Yu and
                 Zheng Wang",
  title =        "Reinforcement Learning-Based Dialogue Guided Event
                 Extraction to Exploit Argument Relations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "520--533",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Santiago Ruiz and Toon van Waterschoot and Marc
                 Moonen",
  title =        "Distributed Combined Acoustic Echo Cancellation and
                 Noise Reduction in Wireless Acoustic Sensor and
                 Actuator Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "534--547",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lukas Grinewitschus and Peter Jung",
  title =        "The Harmonic Shift Algorithm for Efficient Multi-Pitch
                 Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "548--561",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ziyao Lu and Xiang Li and Yang Liu and Chulun Zhou and
                 Jianwei Cui and Bin Wang and Min Zhang and Jinsong Su",
  title =        "Exploring Multi-Stage Information Interactions for
                 Multi-Source Neural Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "562--570",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jingxuan Yang and Si Li and Sheng Gao and Jun Guo",
  title =        "{CorefDPR}: a Joint Model for Coreference Resolution
                 and Dropped Pronoun Recovery in {Chinese}
                 Conversations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "571--581",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Timu{\c{c}}in Berk Atalay and Z{\"u}hre S{\"u} G{\"u}l
                 and Enzo {De Sena} and Zoran Cvetkovi{\'c} and
                 H{\"u}seyin Hac{\i}habibo{\u{g}}lu",
  title =        "Scattering Delay Network Simulator of Coupled Volume
                 Acoustics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "582--593",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi Zhang and Lei Li and Yunfang Wu and Qi Su and Xu
                 Sun",
  title =        "Alleviating the Knowledge-Language Inconsistency: a
                 Study for Deep Commonsense Knowledge",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "594--604",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ke Tan and Zhong-Qiu Wang and DeLiang Wang",
  title =        "Neural Spectrospatial Filtering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "605--621",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qianren Mao and Jianxin Li and Chenghua Lin and
                 Congwen Chen and Hao Peng and Lihong Wang and Philip S.
                 Yu",
  title =        "Adaptive Pre-Training and Collaborative Fine-Tuning: a
                 Win-Win Strategy to Improve Review Analysis Tasks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "622--634",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zifeng Cheng and Zhiwei Jiang and Yafeng Yin and Cong
                 Wang and Qing Gu",
  title =        "Learning to Classify Open Intent via Soft Labeling and
                 Manifold Mixup",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "635--645",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaochun An and Frank K. Soong and Lei Xie",
  title =        "Disentangling Style and Speaker Attributes for {TTS}
                 Style Transfer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "646--658",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhuang Chen and Tieyun Qian",
  title =        "Retrieve-and-Edit Domain Adaptation for {End2End}
                 Aspect Based Sentiment Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "659--672",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jian Liu and Mengshi Yu and Yufeng Chen and Jinan Xu",
  title =        "Cross-Domain Slot Filling as Machine Reading
                 Comprehension: a New Perspective",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "673--685",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yongkang Liu and Qingbao Huang and Jing Li and
                 Linzhang Mo and Yi Cai and Qing Li",
  title =        "{SSAP}: Storylines and Sentiment Aware Pre-Trained
                 Model for Story Ending Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "686--694",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ying Zhou and Xuefeng Liang and Yu Gu and Yifei Yin
                 and Longshan Yao",
  title =        "Multi-Classifier Interactive Learning for Ambiguous
                 Speech Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "695--705",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Poul Hoang and Jan Mark de Haan and Zheng-Hua Tan and
                 Jesper Jensen",
  title =        "Multichannel Speech Enhancement With Own Voice-Based
                 Interfering Speech Suppression for Hearing Assistive
                 Devices",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "706--720",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Weijie Yu and Chen Xu and Jun Xu and Liang Pang and
                 Ji-Rong Wen",
  title =        "Distribution Distance Regularized Sequence
                 Representation for Text Matching in Asymmetrical
                 Domains",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "721--733",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Heming Wang and DeLiang Wang",
  title =        "Neural Cascade Architecture With Triple-Domain Loss
                 for Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "734--743",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Riccardo R. {De Lucia} and Antonio Canclini and Fabio
                 Antonacci and Augusto Sarti",
  title =        "Group Dictionary Equivalent Source Method for Sparse
                 Nearfield Acoustic Holography",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "744--757",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tong Ma and Ying Wei and Xin Lou",
  title =        "Reconfigurable Nonuniform Filter Bank for Hearing Aid
                 Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "758--771",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Victoria Mingote and Antonio Miguel and Dayana Ribas
                 and Alfonso Ortega and Eduardo Lleida",
  title =        "{aDCF} Loss Function for Deep Metric Learning in
                 End-to-End Text-Dependent Speaker Verification
                 Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "772--784",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Quansheng Tu and Huawei Chen",
  title =        "Theoretical Lower Bounds on the Performance of the
                 First-Order Differential Microphone Arrays With Sensor
                 Imperfections",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "785--801",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Taihui Wang and Feiran Yang and Jun Yang",
  title =        "Convolutive Transfer Function-Based Multichannel
                 Nonnegative Matrix Factorization for Overdetermined
                 Blind Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "802--815",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi Zhang and Guangyou Zhou and Zhiwen Xie and Jimmy
                 Xiangji Huang",
  title =        "{HGEN}: Learning Hierarchical Heterogeneous Graph
                 Encoding for Math Word Problem Solving",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "816--828",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Eduardo Fonseca and Xavier Favory and Jordi Pons and
                 Frederic Font and Xavier Serra",
  title =        "{FSD50K}: an Open Dataset of Human-Labeled Sound
                 Events",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "829--852",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi Lei and Shan Yang and Xinsheng Wang and Lei Xie",
  title =        "{MsEmoTTS}: Multi-Scale Emotion Transfer, Prediction,
                 and Control for Emotional Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "853--864",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tao Wang and Ruibo Fu and Jiangyan Yi and Jianhua Tao
                 and Zhengqi Wen",
  title =        "{NeuralDPS}: Neural Deterministic Plus Stochastic
                 Model With Multiband Excitation for Noise-Controllable
                 Waveform Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "865--878",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Simon Stone and Yingming Gao and Peter Birkholz",
  title =        "Articulatory Synthesis of Vocalized {\tt /r/}
                 Allophones in {German}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "879--889",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Prashant Serai and Vishal Sunder and Eric
                 Fosler-Lussier",
  title =        "Hallucination of Speech Recognition Errors With
                 Sequence to Sequence Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "890--900",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bin Wu and Sakriani Sakti and Jinsong Zhang and
                 Satoshi Nakamura",
  title =        "Modeling Unsupervised Empirical Adaptation by {DPGMM}
                 and {DPGMM-RNN} Hybrid Model to Extract Perceptual
                 Features for Low-Resource {ASR}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "901--916",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mi Zhang and Tieyun Qian and Bing Liu",
  title =        "Exploit Feature and Relation Hierarchy for Relation
                 Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "917--930",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wenxiang Jiao and Xing Wang and Shilin He and Zhaopeng
                 Tu and Irwin King and Michael R. Lyu",
  title =        "Exploiting Inactive Examples for Natural Language
                 Generation With Data Rejuvenation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "931--943",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Youzhi Tu and Man-Wai Mak",
  title =        "Aggregating Frame-Level Information in the Spectral
                 Domain With Self-Attention for Speaker Embedding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "944--957",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhixing Tan and Zeyuan Yang and Meng Zhang and Qun Liu
                 and Maosong Sun and Yang Liu",
  title =        "Dynamic Multi-Branch Layers for On-Device Neural
                 Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "958--967",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Weiwei Lin and Man-Wai Mak",
  title =        "Mixture Representation Learning for Deep Speaker
                 Embedding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "968--978",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Peng Zhu and Dawei Cheng and Fangzhou Yang and Yifeng
                 Luo and Dingjiang Huang and Weining Qian and Aoying
                 Zhou",
  title =        "Improving {Chinese} Named Entity Recognition by
                 Large-Scale Syntactic Dependency Graph",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "979--991",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaobo Liang and Lijun Wu and Juntao Li and Tao Qin
                 and Min Zhang and Tie-Yan Liu",
  title =        "Multi-Teacher Distillation With Single Model for
                 Neural Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "992--1002",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaofeng Chen and Guohua Wang and Haopeng Ren and Yi
                 Cai and Ho-fung Leung and Tao Wang",
  title =        "Task-Adaptive Feature Fusion for Generalized Few-Shot
                 Relation Classification in an Open World Environment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1003--1015",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yu-Chen Lin and Cheng Yu and Yi-Te Hsu and Szu-Wei Fu
                 and Yu Tsao and Tei-Wei Kuo",
  title =        "{SEOFP-NET}: Compression and Acceleration of Deep
                 Neural Networks for Speech Enhancement Using
                 Sign-Exponent-Only Floating-Points",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1016--1031",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tomohiro Nakatani and Rintaro Ikeshita and Keisuke
                 Kinoshita and Hiroshi Sawada and Naoyuki Kamo and Shoko
                 Araki",
  title =        "Switching Independent Vector Analysis and its
                 Extension to Blind and Spatially Guided Convolutional
                 Beamforming Algorithms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1032--1047",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jianhua Geng and Sifan Wang and Qinglai Liu and Xin
                 Lou",
  title =        "Multi-Level Time-Frequency Bins Selection for
                 Direction of Arrival Estimation Using a Single Acoustic
                 Vector Sensor",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1048--1060",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qinzhuo Wu and Qi Zhang and Xuanjing Huang",
  title =        "Automatic Math Word Problem Generation With
                 Topic-Expression Co-Attention Mechanism and
                 Reinforcement Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1061--1072",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Michael Nigro and Sridhar Krishnan",
  title =        "Multimodal System for Audio Scene Source Counting and
                 Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1073--1082",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yishu Peng and Sheng Zhang and Jiashu Zhang and Wei
                 Xing Zheng",
  title =        "Combined-Sample Multiband-Structured Subband Filtering
                 Algorithms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1083--1092",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shoukang Hu and Xurong Xie and Mingyu Cui and Jiajun
                 Deng and Shansong Liu and Jianwei Yu and Mengzhe Geng
                 and Xunying Liu and Helen Meng",
  title =        "Neural Architecture Search for {LF-MMI} Trained Time
                 Delay Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1093--1107",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xudong Dang and Wen Ma and Emanu{\"e}l A. P. Habets
                 and Hongyan Zhu",
  title =        "{TDOA}-Based Robust Sound Source Localization With
                 Sparse Regularization in Wireless Acoustic Sensor
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1108--1123",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shan Gao and Jing Lin and Xihong Wu and Tianshu Qu",
  title =        "Sparse {DNN} Model for Frequency Expanding of Higher
                 Order Ambisonics Encoding Process",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1124--1135",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Giovanni Pepe and Leonardo Gabrielli and Stefano
                 Squartini and Carlo Tripodi and Nicol{\`o} Strozzi",
  title =        "Deep Optimization of Parametric {IIR} Filters for
                 Audio Equalization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1136--1149",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Moa Lee and Junmo Lee and Joon-Hyuk Chang",
  title =        "Non-Autoregressive Fully Parallel Deep Convolutional
                 Neural Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1150--1159",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Liam Barrett and Junchao Hu and Peter Howell",
  title =        "Systematic Review of Machine Learning Approaches for
                 Detecting Developmental Stuttering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1160--1172",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sang-Hoon Lee and Hyeong-Rae Noh and Woo-Jeoung Nam
                 and Seong-Whan Lee",
  title =        "Duration Controllable Voice Conversion via
                 Phoneme-Based Information Bottleneck",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1173--1183",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhihong Shao and Zhongqin Wu and Minlie Huang",
  title =        "{AdvExpander}: Generating Natural Language Adversarial
                 Examples by Expanding Text",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1184--1196",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dhanunjaya Varma Devalraju and Padmanabhan Rajan",
  title =        "Multiview Embeddings for Soundscape Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1197--1206",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chengyu Wang and Suyang Dai and Yipeng Wang and Fei
                 Yang and Minghui Qiu and Kehan Chen and Wei Zhou and
                 Jun Huang",
  title =        "{ARoBERT}: an {ASR} Robust Pre-Trained Language Model
                 for Spoken Language Understanding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1207--1218",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jonah Ong and Ba Tuong Vo and Sven Nordholm and Ba-Ngu
                 Vo and Diluka Moratuwage and Changbeom Shim",
  title =        "Audio-Visual Based Online Multi-Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1219--1234",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Leyang Cui and Yafu Li and Yue Zhang",
  title =        "Label Attention Network for Structured Prediction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1235--1248",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sarinah Sutojo and Tobias May and Steven van de Par",
  title =        "Segmentation of Multitalker Mixtures Based on Local
                 Feature Contrasts and Auditory Glimpses",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1249--1262",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hao Gao and Xuelei Feng and Yong Shen",
  title =        "Weighted Loudspeaker Placement Method for Sound Field
                 Reproduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1263--1276",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Gongping Huang and Jacob Benesty and Israel Cohen and
                 Jingdong Chen",
  title =        "{Kronecker} Product Multichannel Linear Filtering for
                 Adaptive Weighted Prediction Error-Based Speech
                 Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1277--1289",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Takehiro Sugimoto",
  title =        "Loudness-Level-Chasing Algorithm for Multiformat Live
                 Audio Production",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1290--1304",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Junshuang Wu and Richong Zhang and Yongyi Mao and
                 Jinpeng Huai",
  title =        "Dealing With Hierarchical Types and Label Noise in
                 Fine-Grained Entity Typing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1305--1318",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anton Ragni and Mark J. F. Gales and Oliver Rose and
                 Katherine M. Knill and Alexandros Kastanos and Qiujia
                 Li and Preben M. Ness",
  title =        "Increasing Context for Estimating Confidence Scores in
                 Automatic Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1319--1329",
  year =         "2022",
  CODEN =        "????",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu Apr 7 10:27:19 2022",
  bibsource =    "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhongxin Bai and Jianyu Wang and Xiao-Lei Zhang and
                 Jingdong Chen",
  title =        "End-to-End Speaker Verification via Curriculum
                 Bipartite Ranking Weighted Binary Cross-Entropy",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1330--1344",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "End-to-end speaker verification achieves the
                 verification through estimating directly the similarity
                 score between a pair of utterances, which is formulated
                 as a binary (i.e., target versus non-target)
                 classification problem. Unlike the stage-wise method,
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shang-Yi Chuang and Hsin-Min Wang and Yu Tsao",
  title =        "Improved {Lite} Audio-Visual Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1345--1359",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Numerous studies have investigated the effectiveness
                 of audio-visual multimodal learning for speech
                 enhancement (AVSE) tasks, seeking a solution that uses
                 visual data as auxiliary and complementary input to
                 reduce the noise of noisy speech signals. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Gaofeng Cheng and Haoran Miao and Runyan Yang and Keqi
                 Deng and Yonghong Yan",
  title =        "{ETEH}: Unified Attention-Based End-to-End {ASR} and
                 {KWS} Architecture",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1360--1373",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Even though attention-based end-to-end (E2E) automatic
                 speech recognition (ASR) models have been yielding
                 state-of-the-art recognition accuracy, they still fall
                 behind many of the ASR models deployed in the industry
                 in some crucial functionalities such as \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ashutosh Pandey and DeLiang Wang",
  title =        "Self-Attending {RNN} for Speech Enhancement to Improve
                 Cross-Corpus Generalization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1374--1385",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Deep neural networks (DNNs) represent the mainstream
                 methodology for supervised speech enhancement,
                 primarily due to their capability to model complex
                 functions using hierarchical representations. However,
                 a recent study revealed that DNNs trained on a
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Di Jin and Shuyang Gao and Seokhwan Kim and Yang Liu
                 and Dilek Hakkani-T{\"u}r",
  title =        "Towards Textual Out-of-Domain Detection Without
                 In-Domain Labels",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1386--1395",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In many real-world settings, machine learning models
                 need to identify user inputs that are out-of-domain
                 (OOD) so as to avoid performing wrong actions. This
                 work focuses on a challenging case of OOD detection,
                 where no labels for in-domain data are \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "K. Mrinalini and P. Vijayalakshmi and T. Nagarajan",
  title =        "{SBSim}: a {Sentence-BERT} Similarity-Based Evaluation
                 Metric for {Indian} Language Neural Machine Translation
                 Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1396--1406",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Machine translation (MT) outputs are widely scored
                 using automatic evaluation metrics and human evaluation
                 scores. The automatic evaluation metrics are expected
                 to be easily computable and a reflection of human
                 evaluation. Traditional string-based metrics \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Changhong Wang and Emmanouil Benetos and Vincent
                 Lostanlen and Elaine Chew",
  title =        "Adaptive Scattering Transforms for Playing Technique
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1407--1421",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Playing techniques contain distinctive information
                 about musical expressivity and interpretation. Yet,
                 current research in music signal analysis suffers from
                 a scarcity of computational models for playing
                 techniques, especially in the context of live
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Danwei Cai and Weiqing Wang and Ming Li",
  title =        "Incorporating Visual Information in Audio Based
                 Self-Supervised Speaker Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1422--1435",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The current success of deep learning largely benefits
                 from the availability of large amount of labeled data.
                 However, collecting a large-scale dataset with human
                 annotation can be expensive and sometimes difficult.
                 Self-supervised learning thus attracts \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yu Luo and Lina Pu",
  title =        "{EC-ANC}: Edge Case-Enhanced Active Noise Cancellation
                 for True Wireless Stereo Earbuds",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1436--1447",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we propose an edge case-enhanced active
                 noise cancellation (EC-ANC) system that integrates a
                 piezo microphone, a signal processor, and a wireless
                 module into the charging case of TWS earbuds.
                 Considering the fact that sound travels much \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tao Li and Xinsheng Wang and Qicong Xie and Zhichao
                 Wang and Lei Xie",
  title =        "Cross-Speaker Emotion Disentangling and Transfer for
                 End-to-End Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1448--1460",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The cross-speaker emotion transfer task in
                 text-to-speech (TTS) synthesis particularly aims to
                 synthesize speech for a target speaker with the emotion
                 transferred from reference speech recorded by another
                 (source) speaker. During the emotion transfer
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yilin Zhao and Zhuosheng Zhang and Hai Zhao",
  title =        "Reference Knowledgeable Network for Machine Reading
                 Comprehension",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1461--1473",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Multi-choice Machine Reading Comprehension (MRC) as a
                 challenge requires models to select the most
                 appropriate answer from a set of candidates with a
                 given passage and question. Most of the existing
                 researches focus on the modeling of specific tasks or
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Fu-Hao Yu and Kuan-Yu Chen and Ke-Han Lu",
  title =        "Non-Autoregressive {ASR} Modeling Using Pre-Trained
                 Language Models for {Chinese} Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1474--1482",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Transformer-based models have led to significant
                 innovation in various classic and practical subjects,
                 including speech processing, natural language
                 processing, and computer vision. On top of the
                 Transformer, attention-based end-to-end automatic
                 speech \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yiming Cui and Ting Liu and Wanxiang Che and Zhigang
                 Chen and Shijin Wang",
  title =        "Teaching Machines to Read, Answer and Explain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1483--1492",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "With various Pre-trained Language Models (PLMs)
                 blooming, Machine Reading Comprehension (MRC) systems
                 have embraced significant improvements on various
                 benchmarks and even surpassed human performances.
                 However, most existing works only focus on the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shota Horiguchi and Yusuke Fujita and Shinji Watanabe
                 and Yawen Xue and Paola Garc{\'\i}a",
  title =        "Encoder-Decoder Based Attractors for End-to-End Neural
                 Diarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1493--1507",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper investigates an end-to-end neural
                 diarization (EEND) method for an unknown number of
                 speakers. In contrast to the conventional cascaded
                 approach to speaker diarization, EEND methods are
                 better in terms of speaker overlap handling. However,
                 EEND \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chenda Li and Zhuo Chen and Yanmin Qian",
  title =        "Dual-Path Modeling With Memory Embedding Model for
                 Continuous Speech Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1508--1520",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Continuous speech separation (CSS) aims at separating
                 overlap-free targets from a long, partially-overlapped
                 recording. Though it has shown promising results, the
                 origin CSS framework does not consider cross-window
                 information and long-span dependency. To \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yu Tong and Jingzhi Guo and Jizhe Zhou",
  title =        "Separation Inference: a Unified Framework for Word
                 Segmentation in {East} {Asian} Languages",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "30",
  number =       "??",
  pages =        "1521--1530",
  year =         "2022",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:28:53 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Existing methods consider Word Segmentation (WS) as
                 sequence tagging. Each tag indicates the position of
                 the current character in a segment. The exactness of
                 the position for any non-boundaries character is
                 unnecessary. Any incorrect inner prediction \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mrinmoy Bhattacharjee and S. R. M. Prasanna and
                 Prithwijit Guha",
  title =        "Clean vs. Overlapped Speech-Music Detection Using
                 Harmonic-Percussive Features and Multi-Task Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1--10",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Detection of speech and music signals in isolated and
                 overlapped conditions is an essential preprocessing
                 step for many audio applications. Speech signals have
                 \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhaojie Luo and Shoufeng Lin and Rui Liu and Jun Baba
                 and Yuichiro Yoshikawa and Hiroshi Ishiguro",
  title =        "Decoupling Speaker-Independent Emotions for Voice
                 Conversion via Source-Filter Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "11--24",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Emotional voice conversion (VC) aims to convert a
                 neutral voice to an emotional one while retaining the
                 linguistic information and speaker identity. We note
                 that \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jinchuan Tian and Jianwei Yu and Chao Weng and Yuexian
                 Zou and Dong Yu",
  title =        "Integrating Lattice-Free {MMI} Into End-to-End Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "25--38",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In automatic speech recognition (ASR) research,
                 discriminative criteria have achieved superior
                 performance in DNN-HMM systems. Given this success, the
                 \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ravi Shankar and Hsi-Wei Hsieh and Nicolas Charon and
                 Archana Venkataraman",
  title =        "A Diffeomorphic Flow-Based Variational Framework for
                 Multi-Speaker Emotion Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "39--53",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper introduces a new framework for non-parallel
                 emotion conversion in speech. Our framework is based on
                 two key contributions. First, we propose a \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ryandhimas E. Zezario and Szu-Wei Fu and Fei Chen and
                 Chiou-Shann Fuh and Hsin-Min Wang and Yu Tsao",
  title =        "Deep Learning-Based Non-Intrusive Multi-Objective
                 Speech Assessment Model With Cross-Domain Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "54--70",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "This study proposes a cross-domain multi-objective
                 speech assessment model, called MOSA-Net, which can
                 simultaneously estimate the speech quality, \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaoyi Qin and Danwei Cai and Ming Li",
  title =        "Robust Multi-Channel Far-Field Speaker Verification
                 Under Different In-Domain Data Availability Scenarios",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "71--85",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The popularity and application of smart home devices
                 have made far-field speaker verification an urgent
                 need. However, speaker verification performance is
                 \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Vikram C. Mathad and Julie M. Liss and Kathy Chapman
                 and Nancy Scherer and Visar Berisha",
  title =        "Consonant-Vowel Transition Models Based on Deep
                 Learning for Objective Evaluation of Articulation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "86--95",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Spectro-temporal dynamics of consonant-vowel (CV)
                 transition regions are considered to provide robust
                 cues related to articulation. In this work, we propose
                 an \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Li Li and Hirokazu Kameoka and Shoji Makino",
  title =        "{FastMVAE2}: On Improving and Accelerating the Fast
                 Variational Autoencoder-Based Source Separation
                 Algorithm for Determined Mixtures",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "96--110",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "This article proposes a new source model and training
                 scheme to improve the accuracy and speed of the
                 multichannel variational autoencoder (MVAE) method. The
                 \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jie Wang and Yan Yang and Keyu Liu and Zhiping Zhu and
                 Xiaorong Liu",
  title =        "{M3S}: Scene Graph Driven Multi-Granularity Multi-Task
                 Learning for Multi-Modal {NER}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "111--120",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Multi-modal Named Entity Recognition (MNER), which
                 mainly focuses on enhancing text-only NER with visual
                 information, has recently attracted considerable \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Marc Delcroix and Jorge Bennasar Vazquez and Tsubasa
                 Ochiai and Keisuke Kinoshita and Yasunori Ohishi and
                 Shoko Araki",
  title =        "{SoundBeam}: Target Sound Extraction Conditioned on
                 Sound-Class Labels and Enrollment Clues for Increased
                 Performance and Continuous Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "121--136",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In many situations, we would like to hear desired
                 sound events (SEs) while being able to ignore
                 interference. Target sound extraction (TSE) tackles
                 this \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Daisuke Niizumi and Daiki Takeuchi and Yasunori Ohishi
                 and Noboru Harada and Kunio Kashino",
  title =        "{BYOL} for Audio: Exploring Pre-Trained
                 General-Purpose Audio Representations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "137--151",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Pre-trained models are essential as feature extractors
                 in modern machine learning systems in various domains.
                 In this study, we hypothesize that representations
                 \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yingrui Xu and Hao Liu and Jingguo Ge and Xiaodan
                 Zhang and Jingyuan Hu and Yulei Wu and Honglei Lv and
                 Hongbin Shi and Wei Zhou",
  title =        "Mining Weak Relations Between Reviews for Opinion Spam
                 Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "152--162",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Online reviews play a significant role in purchase
                 decisions of consumers by providing feedback
                 information from buyers of products. In order to
                 mislead \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yoshiki Masuyama and Kohei Yatabe and Kento Nagatomo
                 and Yasuhiro Oikawa",
  title =        "Online Phase Reconstruction via {DNN-Based} Phase
                 Differences Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "163--176",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper presents a two-stage online phase
                 reconstruction framework using causal deep neural
                 networks (DNNs). Phase reconstruction is a task of
                 \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiang Liu and Donghong Ji and Jingye Li and Dongdong
                 Xie and Chong Teng and Liang Zhao and Fei Li",
  title =        "{TOE}: a Grid-Tagging Discontinuous {NER} Model
                 Enhanced by Embedding {Tag\slash} Word Relations and
                 More Fine-Grained Tags",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "177--187",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "So far, discontinuous named entity recognition (NER)
                 has received increasing research attention and many
                 related methods have surged such as \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhe Hu and Zhiwei Cao and Hou Pong Chan and Jiachen
                 Liu and Xinyan Xiao and Jinsong Su and Hua Wu",
  title =        "Controllable Dialogue Generation With Disentangled
                 Multi-Grained Style Specification and Attribute
                 Consistency Reward",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "188--199",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Controllable text generation is an appealing but
                 challenging task, which allows users to specify
                 particular attributes of the generated outputs. In this
                 paper, we propose \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sondes Abderrazek and Corinne Fredouille and Alain
                 Ghio and Muriel Lalain and Christine Meunier and
                 Virginie Woisard",
  title =        "Interpreting Deep Representations of Phonetic Features
                 via Neuro-Based Concept Detector: Application to Speech
                 Disorders Due to Head and Neck Cancer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "200--214",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The popularity of Deep Neural Networks (DNNs) is
                 growing significantly, and so is the interest in
                 gaining a better understanding of their functioning. In
                 this work, it is \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jie Zhang and Rui Tao and Jun Du and Li-Rong Dai",
  title =        "Energy-Efficient Sparsity-Driven Speech Enhancement in
                 Wireless Acoustic Sensor Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "215--228",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Wireless acoustic sensor network (WASN) has shown a
                 superiority over conventional microphone arrays in many
                 aspects. There exists an important tradeoff \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xianke Wang and Bowen Tian and Weiming Yang and Wei Xu
                 and Wenqing Cheng",
  title =        "{MusicYOLO}: a Vision-Based Framework for Automatic
                 Singing Transcription",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "229--241",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatic singing transcription (AST), which refers to
                 the process of inferring the onset, offset, and pitch
                 from the singing audio, is of great significance in
                 music \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuanyuan Liu and Mittapalle Kiran Reddy and Nelly
                 Penttila and Tiina Ihalainen and Paavo Alku and Okko
                 R{\"a}s{\"a}nen",
  title =        "Automatic Assessment of {Parkinson's} Disease Using
                 Speech Representations of Phonation and Prosody",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "242--255",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech from people with Parkinson's disease
                 (PD) are likely to be degraded on phonation,
                 articulation, and prosody. Motivated to describe \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "David Sudholt and Alec Wright and Cumhur Erkut and
                 Vesa Valimaki",
  title =        "Pruning Deep Neural Network Models of Guitar
                 Distortion Effects",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "256--264",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Deep neural networks have been successfully used in
                 the task of black-box modeling of analog audio effects
                 such as distortion. Improving the processing speed
                 \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Fangkai Jiao and Yangyang Guo and Minlie Huang and
                 Liqiang Nie",
  title =        "Enhanced Multi-Domain Dialogue State Tracker With
                 Second-Order Slot Interactions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "265--276",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Dialogue state tracking (DST) is often used to track
                 the system's understanding of the user goal in
                 task-oriented dialogue systems. \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hui Tian and Yiqin Qiu and Wojciech Mazurczyk and
                 Haizhou Li and Zhenxing Qian",
  title =        "{STFF-SM}: Steganalysis Model Based on Spatial and
                 Temporal Feature Fusion for Speech Streams",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "277--289",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The real-time detection of speech steganography in
                 Voice-over-Internet-Protocol (VoIP) scenarios remains
                 an open problem, as it requires \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Gopendra Vikram Singh and Mauajama Firdaus and Asif
                 Ekbal and Pushpak Bhattacharyya",
  title =        "{EmoInt-Trans}: a Multimodal Transformer for
                 Identifying Emotions and Intents in Social
                 Conversations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "290--300",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In the natural language processing community,
                 open-domain conversational agents, also known as
                 chatbots, are gaining popularity. One of the
                 difficulties \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "De De Hu and Huaiwen Zhang and Feilong Bao and Rui
  title =        "Distributed Sampling Rate Offset Estimation Over
                 Acoustic Sensor Networks Based on Asynchronous Network
                 {Newton} Optimization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "301--312",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Sampling rate synchronization is an inevitable issue
                 in distributed acoustic sensor networks. In this paper,
                 an analytical sampling rate offset (SRO) \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "David Diaz-Guerra and Antonio Miguel and Jose R.
                 Beltran",
  title =        "Direction of Arrival Estimation of Sound Sources Using
                 Icosahedral {CNNs}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "313--321",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we present a new model for Direction of
                 Arrival (DOA) estimation of sound sources based on an
                 Icosahedral Convolutional Neural Network \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Peiming Guo and Shen Huang and Peijie Jiang and
                 Yueheng Sun and Meishan Zhang and Min Zhang",
  title =        "Curriculum-Style Fine-Grained Adaption for
                 Unsupervised Cross-Lingual Dependency Transfer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "322--332",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Unsupervised cross-lingual transfer has been shown
                 great potentials for dependency parsing of the
                 low-resource languages when there is no annotated
                 treebank \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Naveen Kumar Desiraju and Simon Doclo and Markus Buck
                 and Tobias Wolff",
  title =        "Joint Online Estimation of Early and Late Residual
                 Echo {PSD} for Residual Echo Suppression",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "333--344",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In hands-free telephony and other distant-talking
                 applications, an acoustic echo cancellation system is
                 typically required, where a short adaptive filter is
                 \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guangzhi Sun and Chao Zhang and Philip C. Woodland",
  title =        "Minimising Biasing Word Errors for Contextual {ASR}
                 With the Tree-Constrained Pointer Generator",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "345--354",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Contextual knowledge is essential for reducing speech
                 recognition errors on high-valued long-tail words. This
                 paper proposes a novel tree-constrained pointer \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jonah Casebeer and Nicholas J. Bryan and Paris
                 Smaragdis",
  title =        "{Meta-AF}: Meta-Learning for Adaptive Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "355--370",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Adaptive filtering algorithms are pervasive throughout
                 signal processing and have had a material impact on a
                 wide variety of domains including audio \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yingwen Fu and Nankai Lin and Boyu Chen and Ziyu Yang
                 and Shengyi Jiang",
  title =        "Cross-Lingual Named Entity Recognition for
                 Heterogeneous Languages",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "371--382",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Previous works on cross-lingual Named Entity
                 Recognition (NER) have achieved great success. However,
                 few of them consider the effect of language \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jun-You Wang and Jyh-Shing Roger Jang",
  title =        "Training a Singing Transcription Model Using
                 Connectionist Temporal Classification Loss and
                 Cross-Entropy Loss",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "383--396",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we propose a method that uses a
                 combination of the Connectionist Temporal
                 Classification (CTC) loss and the cross-entropy loss to
                 train a note-level singing transcription model. By
                 considering the task as predicting a note sequence of
                 the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhong-Qiu Wang and Gordon Wichern and Shinji Watanabe
                 and Jonathan Le Roux",
  title =        "{STFT-Domain} Neural Speech Enhancement With Very Low
                 Algorithmic Latency",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "397--410",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Deep learning based speech enhancement in the
                 short-time Fourier transform (STFT) domain typically
                 uses a large window length such as 32 ms. A larger
                 window can lead to higher frequency resolution and
                 potentially better enhancement. This however incurs an
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yu Li and Bojie Hu and Jian Liu and Yufeng Chen and
                 Jinan Xu",
  title =        "A Neighborhood Re-Ranking Model With Relation
                 Constraint for Knowledge Graph Completion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "411--425",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Knowledge graph completion (KGC) aims to predict
                 missing links based on observed triples. However,
                 current KGC models are still limited by the following
                 two aspects. (1) the entity semantics is implicitly
                 learned by neural network and merely depends on
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Alessio Miaschi and Dominique Brunato and Felice
                 Dell'Orletta and Giulia Venturi",
  title =        "On Robustness and Sensitivity of a Neural Language
                 Model: a Case Study on {Italian} {L1} Learner Errors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "426--438",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we propose a comprehensive linguistic
                 study aimed at assessing the implicit behavior of one
                 of the most prominent Neural Language Models (NLM)
                 based on Transformer architectures, BERT Devlin et al.,
                 when dealing with a particular source of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rong Xiao and Yu Wan and Baosong Yang and Haibo Zhang
                 and Huajin Tang and Derek F. Wong and Boxing Chen",
  title =        "Towards Energy-Preserving Natural Language
                 Understanding With Spiking Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "439--447",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Artificial neural networks have shown promising
                 results in a variety of natural language understanding
                 (NLU) tasks. Despite their successes, conventional
                 neural-based NLU models are criticized for high energy
                 consumption, making them laborious to be \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Juan Zhao and Tianrui Zong and Yong Xiang and
                 Longxiang Gao and Guang Hua and Keshav Sood and Yushu
                 Zhang",
  title =        "{SSVS-SSVD} Based Desynchronization Attacks Resilient
                 Watermarking Method for Stereo Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "448--461",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Most of the audio signals in real-world applications
                 are stereo signals. However, the previous
                 desynchronization attacks resilient watermarking
                 methods cannot preserve perceptual quality or achieve
                 robustness when constrained by high embedding rates and
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qiquan Zhang and Xinyuan Qian and Zhaoheng Ni and
                 Aaron Nicolson and Eliathamby Ambikairajah and Haizhou
                 Li",
  title =        "A Time-Frequency Attention Module for Neural Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "462--475",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech enhancement plays an essential role in a wide
                 range of speech processing applications. Recent studies
                 on speech enhancement tend to investigate how to
                 effectively capture the long-term contextual
                 dependencies of speech signals to boost performance.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Binhong Xie and Yu Li and Hongyan Zhao and Lihu Pan
                 and Enhui Wang",
  title =        "A Cross-Attention Fusion Based Graph Convolution
                 Auto-Encoder for Open Relation Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "476--485",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Open Relation Extraction (OpenRE) aims at clustering
                 relation instances to extract relation types. By
                 learning relation patterns between named entities, it
                 clusters semantically equivalent patterns into a
                 unified relation cluster. Existing clustering-.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qian-Bei Hong and Chung-Hsien Wu and Hsin-Min Wang",
  title =        "Generalization Ability Improvement of Speaker
                 Representation and Anti-Interference for Speaker
                 Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "486--499",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The ability to generalize to mismatches between
                 training and testing conditions and resist interference
                 from other speakers is crucial for the performance of
                 speaker verification. In this paper, we propose two
                 novel approaches to improve the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xinglin Lyu and Junhui Li and Min Zhang and Chenchen
                 Ding and Hideki Tanaka and Masao Utiyama",
  title =        "Refining History for Future-Aware Neural Machine
                 Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "500--512",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Neural machine translation uses a decoder to generate
                 target words auto-regressively by predicting the next
                 target word conditioned on a given source sentence and
                 its previously predicted target words, i.e, its
                 translation history, which suffers from two \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mou Wang and Junqi Chen and Xiao-Lei Zhang and Susanto
                 Rahardja",
  title =        "End-to-End Multi-Modal Speech Recognition on an Air
                 and Bone Conducted Speech Corpus",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "513--524",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatic speech recognition (ASR) has been
                 significantly improved in the past years. However, most
                 robust ASR systems are based on air-conducted (AC)
                 speech, and their performances in low
                 signal-to-noise-ratio (SNR) conditions are not
                 satisfactory. Bone-. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Asier L{\'o}pez Zorrilla and Mar{\'\i}a In{\'e}s
                 Torres and Heriberto Cuay{\'a}huitl",
  title =        "Audio Embedding-Aware Dialogue Policy Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "525--538",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Following the success of Natural Language Processing
                 (NLP) transformers pretrained via self-supervised
                 learning, similar models have been proposed recently
                 for speech processing such as Wav2Vec2, HuBERT and
                 UniSpeech-SAT. An interesting yet unexplored \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xichen Shang and Chuxin Chen and Zipeng Chen and
                 Qianli Ma",
  title =        "Modularized Mutuality Network for Emotion-Cause Pair
                 Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "539--549",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Emotion-cause pair extraction (ECPE) is an emerging
                 task born out of Emotion cause extraction (ECE), which
                 aims to extract the emotion clause and the
                 corresponding cause clause simultaneously. Previous
                 methods decompose ECPE into multiple sub-tasks,
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xinyuan Qian and Zhengdong Wang and Jiadong Wang and
                 Guohui Guan and Haizhou Li",
  title =        "Audio-Visual Cross-Attention Network for Robotic
                 Speaker Tracking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "550--562",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Audio-visual signals can be used jointly for robotic
                 perception as they complement each other. Such
                 multi-modal sensory fusion has a clear advantage,
                 especially under noisy acoustic conditions. Speaker
                 localization, as an essential robotic function, was
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kristina Tesch and Timo Gerkmann",
  title =        "Insights Into Deep Non-Linear Filters for Improved
                 Multi-Channel Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "563--575",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The key advantage of using multiple microphones for
                 speech enhancement is that spatial filtering can be
                 used to complement the tempo-spectral processing. In a
                 traditional setting, linear spatial filtering
                 (beamforming) and single-channel post-filtering
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Thilo von Neumann and Keisuke Kinoshita and Christoph
                 Boeddeker and Marc Delcroix and Reinhold Haeb-Umbach",
  title =        "Segment-Less Continuous Speech Separation of Meetings:
                 Training and Evaluation Criteria",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "576--589",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Continuous Speech Separation (CSS) has been proposed
                 to address speech overlaps during the analysis of
                 realistic meeting-like conversations by eliminating any
                 overlaps before further processing. CSS separates a
                 recording of arbitrarily many speakers into \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Davide Albertini and Alberto Bernardini and Federico
                 Borra and Fabio Antonacci and Augusto Sarti",
  title =        "Two-Stage Beamforming With Arbitrary Planar Arrays of
                 Differential Microphone Array Units",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "590--602",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Differential Microphone Arrays (DMAs) are of great
                 interest in the literature on small-sized microphone
                 arrays, due to their good directivity properties and
                 nearly frequency-invariant spatial responses. Recently
                 developed beamforming techniques combine \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi-Syuan Chen and Yun-Zhu Song and Hong-Han Shuai",
  title =        "{SPEC}: Summary Preference Decomposition for
                 Low-Resource Abstractive Summarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "603--618",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Neural abstractive summarization has been widely
                 studied and achieved great success with large-scale
                 corpora. However, the considerable cost of annotating
                 data motivates the need for learning strategies under
                 low-resource settings. In this paper, we \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yingying Xiao and Shanmou Chen and Qiangqiang Zhang
                 and Dongyuan Lin and Minglin Shen and Junhui Qian and
                 Shiyuan Wang",
  title =        "Generalized Hyperbolic Tangent Based Random {Fourier}
                 Conjugate Gradient Filter for Nonlinear Active Noise
                 Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "619--632",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The filtered-x least mean square (FxLMS) algorithm has
                 been proposed for an active noise control (ANC) system.
                 However, due to the used mean square error (MSE)
                 criterion, FxLMS suffers from performance degeneration
                 for non-Gaussian noises, dramatically. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jun Qi and Chao-Han Huck Yang and Pin-Yu Chen and
                 Javier Tejedor",
  title =        "Exploiting Low-Rank Tensor-Train Deep Neural Networks
                 Based on {Riemannian} Gradient Descent With
                 Illustrations of Speech Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "633--642",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "This work focuses on designing low-complexity hybrid
                 tensor networks by considering trade-offs between the
                 model complexity and practical performance. Firstly, we
                 exploit a low-rank tensor-train deep neural network
                 (TT-DNN) to build an end-to-end deep \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bin Gu and Wu Guo and Jie Zhang",
  title =        "Memory Storable Network Based Feature Aggregation for
                 Speaker Representation Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "643--655",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Learning fixed-dimensional speaker representation
                 using deep neural networks is a key step in speaker
                 verification. In this work, we propose an auxiliary
                 memory storable network (MSN) to assist a backbone
                 network for learning discriminative features,
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Takumi Abe and Shoichi Koyama and Natsuki Ueno and
                 Hiroshi Saruwatari",
  title =        "Amplitude Matching for Multizone Sound Field Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "656--669",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "A multizone sound field control method, called
                 amplitude matching, is proposed. The objective of
                 amplitude matching is to synthesize a desired amplitude
                 (or magnitude) distribution over a target region with
                 multiple loudspeakers, whereas the phase \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mahdi Barhoush and Ahmed Hallawa and Arne Peine and
                 Lukas Martin and Anke Schmeink",
  title =        "Localization-Driven Speech Enhancement in Noisy
                 Multi-Speaker Hospital Environments Using Deep Learning
                 and Meta Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "670--683",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "This work addresses the problem of 3D-localizing and
                 enhancing the speech of one main speaker in noisy
                 multi-speaker hospital environments using a
                 multi-channel microphone array. In our model, we
                 propose conducting speaker localization using a machine
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Herman Kamper",
  title =        "Word Segmentation on Discovered Phone Units With
                 Dynamic Programming and Self-Supervised Scoring",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "684--694",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Recent work on unsupervised speech segmentation has
                 used self-supervised models with phone and word
                 segmentation modules that are trained jointly. This
                 paper instead revisits an older approach to word
                 segmentation: bottom-up phone-like unit discovery is
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Changheng Li and Jorge Martinez and Richard Christian
                 Hendriks",
  title =        "Joint Maximum Likelihood Estimation of Microphone
                 Array Parameters for a Reverberant Single Source
                 Scenario",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "695--705",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Estimation of the acoustic-scene related parameters
                 such as relative transfer functions (RTFs) from source
                 to microphones, source power spectral densities (PSDs)
                 and PSDs of the late reverberation is essential and
                 also challenging. Existing maximum \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shota Horiguchi and Shinji Watanabe and Paola
                 Garc{\'\i}a and Yuki Takashima and Yohei Kawaguchi",
  title =        "Online Neural Diarization of Unlimited Numbers of
                 Speakers Using Global and Local Attractors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "706--720",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "A method to perform offline and online speaker
                 diarization for an unlimited number of speakers is
                 described in this paper. End-to-end neural diarization
                 (EEND) has achieved overlap-aware speaker diarization
                 by formulating it as a multi-label \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ling He and Jia Fu and Yuanyuan Li and Xi Xiong and
                 Jing Zhang",
  title =        "{WNSA-Net}: an Axial-Attention-Based Network for
                 Schizophrenia Detection Using Wideband and Narrowband
                 Spectrograms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "721--733",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Schizophrenia is a severe mental disease that affects
                 patients' thoughts, feelings, and behaviors.
                 Speech signal has proven to be a biomarker in the early
                 diagnosis of schizophrenia. Previous studies on
                 schizophrenic speech detection are mainly \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anusha Prakash and Hema A. Murthy",
  title =        "Exploring the Role of Language Families for Building
                 Indic Speech Synthesisers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "734--747",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Building end-to-end speech synthesisers for Indian
                 languages is challenging, given the lack of adequate
                 clean training data and multiple grapheme
                 representations across languages. This work explores
                 the importance of training multilingual and
                 multi-speaker \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mahdin Rohmatillah and Jen-Tzung Chien",
  title =        "Hierarchical Reinforcement Learning With Guidance for
                 Multi-Domain Dialogue Policy",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "748--761",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Achieving high performance in a multi-domain dialogue
                 system with low computation is undoubtedly challenging.
                 Previous works applying an end-to-end approach have
                 been very successful. However, the computational cost
                 remains a major issue since the large \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shahram Ghorbani and John H. L. Hansen",
  title =        "Domain Expansion for End-to-End Speech Recognition:
                 Applications for {Accent\slash} Dialect Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "762--774",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Training Automatic Speech Recognition (ASR) systems
                 with sequentially incoming data from alternate domains
                 is an essential milestone in order to reach human
                 intelligibility level in speech recognition. The main
                 challenge of sequential learning is that \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Weidong Chen and Xiaofen Xing and Xiangmin Xu and
                 Jianxin Pang and Lan Du",
  title =        "{SpeechFormer++}: a Hierarchical Efficient Framework
                 for Paralinguistic Speech Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "775--788",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Paralinguistic speech processing is important in
                 addressing many issues, such as sentiment and
                 neurocognitive disorder analyses. Recently, Transformer
                 has achieved remarkable success in the natural language
                 processing field and has demonstrated its \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Nicki Holighaus and G{\"u}nther Koliander and Clara
                 Hollomey and Friedrich Pillichshammer",
  title =        "Grid-Based Decimation for Wavelet Transforms With
                 Stably Invertible Implementation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "789--801",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The constant center frequency to bandwidth ratio
                 (Q-factor) of wavelet transforms provides a very
                 natural representation for audio data. However,
                 invertible wavelet transforms have either required
                 non-uniform decimation---leading to irregular
                 data \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Weiwei Lin and Man-Wai Mak",
  title =        "Robust Speaker Verification Using Deep Weight Space
                 Ensemble",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "802--812",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Domain shift is one of the most challenging problems
                 in speaker verification. Although numerous methods have
                 been proposed to address domain shift, most approaches
                 optimize the performance of one domain at the sacrifice
                 of the other. As a result, to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lin Zhang and Xin Wang and Erica Cooper and Nicholas
                 Evans and Junichi Yamagishi",
  title =        "The {PartialSpoof} Database and Countermeasures for
                 the Detection of Short Fake Speech Segments Embedded in
                 an Utterance",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "813--825",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatic speaker verification is susceptible to
                 various manipulations and spoofing, such as
                 text-to-speech synthesis, voice conversion, replay,
                 tampering, adversarial attacks, and so on. We consider
                 a new spoofing scenario called ``Partial Spoof''
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jie Mei and Yufan Wang and Xinhui Tu and Ming Dong and
                 Tingting He",
  title =        "Incorporating {BERT} With Probability-Aware Gate for
                 Spoken Language Understanding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "826--834",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Spoken language understanding (SLU) is an essential
                 part of a task-oriented dialogue system, which mainly
                 includes intent detection and slot filling. Some
                 existing approaches obtain enhanced semantic
                 representation by establishing the correlation between
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tsubasa Ochiai and Marc Delcroix and Tomohiro Nakatani
                 and Shoko Araki",
  title =        "Mask-Based Neural Beamforming for Moving Speakers With
                 Self-Attention-Based Tracking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "835--848",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Beamforming is a powerful tool designed to enhance
                 speech signals from the direction of a target source.
                 Computing the beamforming filter requires estimating
                 spatial covariance matrices (SCMs) of the source and
                 noise signals. Time-frequency masks are \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rongzhi Gu and Shi-Xiong Zhang and Yuexian Zou and
                 Dong Yu",
  title =        "Towards Unified All-Neural Beamforming for Time and
                 Frequency Domain Speech Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "849--862",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Recently, frequency domain all-neural beamforming
                 methods have achieved remarkable progress for
                 multichannel speech separation. In parallel, the
                 integration of time domain network structure and
                 beamforming also gains significant attention. This
                 study \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Naotake Masuda and Daisuke Saito",
  title =        "Improving Semi-Supervised Differentiable Synthesizer
                 Sound Matching for Practical Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "863--875",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "While synthesizers have become commonplace in music
                 production, many users find it difficult to control the
                 parameters of a synthesizer to create a sound as they
                 intended. In order to assist the user, the \emph{sound
                 matching} task aims to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Erfan Loweimi and Zhengjun Yue and Peter Bell and
                 Steve Renals and Zoran Cvetkovic",
  title =        "Multi-Stream Acoustic Modelling Using Raw Real and
                 Imaginary Parts of the {Fourier} Transform",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "876--890",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we investigate multi-stream acoustic
                 modelling using the raw real and imaginary parts of the
                 Fourier transform of speech signals. Using the raw
                 magnitude spectrum, or features derived from it, as a
                 proxy for the real and imaginary parts \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bengt J. Borgstr{\"o}m",
  title =        "A Generative Approach to Condition-Aware Score
                 Calibration for Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "891--901",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In speaker verification, score calibration is employed
                 to transform verification scores to log-likelihood
                 ratios (LLRs) which are statistically interpretable.
                 Conventional calibration techniques apply a global
                 score transform. However, in condition-aware \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Irene Mart{\'\i}n-Morat{\'o} and Annamaria Mesaros",
  title =        "Strong Labeling of Sound Events Using Crowdsourced
                 Weak Labels and Annotator Competence Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "902--914",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Crowdsourcing is a popular tool for collecting large
                 amounts of annotated data, but the specific format of
                 the strong labels necessary for sound event detection
                 is not easily obtainable through crowdsourcing. In this
                 work, we propose a novel annotation \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wenzhao Zhu and Lei Luo and Jinwei Sun and Mads
                 Gr{\ae}sb{\o}ll Christensen",
  title =        "A New Virtual Tracking Sub-Algorithm Based Hybrid
                 Active Control System for Narrowband Noise With
                 Impulsive Interference",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "915--926",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Mechanical noise is usually a mixture of narrowband
                 and impulsive noise which needs complex active noise
                 control (ANC) algorithms to improve the de-noising
                 performance. But the ANC algorithm with a high
                 computation load will reduce the real-time \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Thomas Deppisch and Sebasti{\`a} V. Amengual Gar{\'\i}
                 and Paul Calamia and Jens Ahrens",
  title =        "Direct and Residual Subspace Decomposition of Spatial
                 Room Impulse Responses",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "927--942",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Psychoacoustic experiments have shown that directional
                 properties of the direct sound, salient reflections,
                 and the late reverberation of an acoustic room response
                 can have a distinct influence on the auditory
                 perception of a given room. Spatial room \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Eloi Moliner and Vesa V{\"a}lim{\"a}ki",
  title =        "{BEHM-GAN}: Bandwidth Extension of Historical Music
                 Using Generative Adversarial Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "943--956",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Audio bandwidth extension aims to expand the spectrum
                 of bandlimited audio signals. Although this topic has
                 been broadly studied during recent years, the
                 particular problem of extending the bandwidth of
                 historical music recordings remains an open \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Martin J{\"a}lmby and Filip Elvander and Toon van
                 Waterschoot",
  title =        "Low-Rank Room Impulse Response Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "957--969",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper we consider low-rank estimation of room
                 impulse responses (RIRs). Inspired by a physics-driven
                 room-acoustical model, we propose an estimator of RIRs
                 that promotes a low-rank structure for a matricization,
                 or reshaping, of the estimated RIR. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hong Liu and Yucheng Cai and Zhenru Lin and Zhijian Ou
                 and Yi Huang and Junlan Feng",
  title =        "Variational Latent-State {GPT} for Semi-Supervised
                 Task-Oriented Dialog Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "970--984",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Recently, two approaches, fine-tuning large
                 pre-trained language models and variational training,
                 have attracted significant interests, separately, for
                 semi-supervised end-to-end task-oriented dialog (TOD)
                 systems. In this paper, we propose Variational
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "De Hu and Qintuya Si and Rui Liu and Feilong Bao",
  title =        "Distributed Sensor Selection for Speech Enhancement
                 With Acoustic Sensor Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "985--999",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In distributed acoustic sensor networks, only a few
                 nodes make a significant contribution to speech
                 enhancement tasks. Using these most informative nodes
                 instead of the entire network not only avoids
                 unnecessary energy consumption but also prolongs the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yingke Zhu and Brian Mak",
  title =        "{Bayesian} Self-Attentive Speaker Embeddings for
                 Text-Independent Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1000--1012",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Learning effective and discriminative speaker
                 embeddings is a crucial task in speaker verification.
                 Usually, speaker embeddings are extracted from a
                 speaker-classification DNN that averages the hidden
                 vectors over all the spoken frames of a speaker; the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuying Li and Yuchen Liu and Donald S. Williamson",
  title =        "A Composite {T60} Regression and Classification
                 Approach for Speech Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1013--1023",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Dereverberation is often performed directly on the
                 reverberant audio signal, without knowledge of the
                 acoustic environment. Reverberation time, \ldots{},
                 however, is an essential \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hanyi Zhang and Longbiao Wang and Kong Aik Lee and
                 Meng Liu and Jianwu Dang and Helen Meng",
  title =        "Meta-Generalization for Domain-Invariant Speaker
                 Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1024--1036",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatic speaker verification (ASV) exhibits
                 unsatisfactory performance under domain mismatch
                 conditions owing to intrinsic and extrinsic factors,
                 such as variations in speaking styles and recording
                 devices encountered in real-world applications. To
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shu-Tong Niu and Jun Du and Lei Sun and Yu Hu and
                 Chin-Hui Lee",
  title =        "{QDM-SSD}: Quality-Aware Dynamic Masking for
                 Separation-Based Speaker Diarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1037--1049",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "We improve iterative separation-based speaker
                 diarization (ISSD) with quality-aware dynamic masking
                 (QDM). We call the proposed framework QDM-SSD. Compared
                 with ISSD, QDM-SSD enhances the simulated data used for
                 model adaptation through QDM to alleviate \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Boyang Lyu and Chunxiao Fan and Yue Ming and Panzi
                 Zhao and Nannan Hu",
  title =        "{En-HACN}: Enhancing Hybrid Architecture With Fast
                 Attention and Capsule Network for End-to-end Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1050--1062",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatic speech recognition (ASR) is a fundamental
                 technology in the field of artificial intelligence.
                 End-to-end (E2E) ASR is favored for its
                 state-of-the-art performance. However, E2E speech
                 recognition still faces speech spatial information loss
                 and \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yang Liu and Haoqin Sun and Wenbo Guan and Yuqi Xia
                 and Yongwei Li and Masashi Unoki and Zhen Zhao",
  title =        "A Discriminative Feature Representation Method Based
                 on Cascaded Attention Network With Adversarial Strategy
                 for Speech Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1063--1074",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Currently, speech emotion recognition models still
                 could not show satisfactory performance due to the
                 complexity of emotions. In most of the previous
                 studies, there is a common problem that some of the
                 particular emotions are severely misclassified. In
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hao Zhang and Nianwen Si and Yaqi Chen and Wenlin
                 Zhang and Xukui Yang and Dan Qu and Wei-Qiang Zhang",
  title =        "Improving Speech Translation by Cross-Modal
                 Multi-Grained Contrastive Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1075--1086",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The end-to-end speech translation (E2E-ST) model has
                 gradually become a mainstream paradigm due to its low
                 latency and less error propagation. However, it is
                 non-trivial to train such a model well due to the task
                 complexity and data scarcity. The speech-. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wei-Cheng Lin and Carlos Busso",
  title =        "Sequential Modeling by Leveraging Non-Uniform
                 Distribution of Speech Emotion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1087--1099",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The expression and perception of human emotions are
                 not uniformly distributed over time. Therefore,
                 tracking local changes of emotion within a segment can
                 lead to better models for \emph{speech emotion
                 recognition} (SER), even when the task is \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Achyut Mani Tripathi and Om Jee Pandey",
  title =        "Divide and Distill: New Outlooks on Knowledge
                 Distillation for Environmental Sound Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1100--1113",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Environmental sound classification (ESC) is an
                 important research problem with a broad range of
                 applications including audio-based surveillance,
                 audio-visual systems, smart homes, and robotics, among
                 others. The recently proposed vision multi-layer
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hao Zhang and Ashutosh Pandey and DeLiang Wang",
  title =        "Low-Latency Active Noise Control Using Attentive
                 Recurrent Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1114--1123",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Processing latency is a critical issue for active
                 noise control (ANC) due to the causality constraint of
                 ANC systems. This paper addresses low-latency ANC in
                 the context of deep learning (i.e. deep ANC). A
                 time-domain method using an attentive recurrent
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Avital Bross and Sharon Gannot",
  title =        "Training-Based Multiple Source Tracking Using
                 Manifold-Learning and Recursive
                 Expectation-Maximization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1124--1140",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper we propose a data-driven approach for
                 multiple speaker tracking in reverberant enclosures.
                 The speakers are uttering, possibly overlapping, speech
                 signals while moving in the environment. The method
                 comprises two stages. The first stage \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guimin Hu and Yi Zhao and Guangming Lu",
  title =        "Emotion Prediction Oriented Method With Multiple
                 Supervisions for Emotion-Cause Pair Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1141--1152",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Emotion-cause pair extraction (ECPE) task aims to
                 extract all the pairs of emotions and their causes from
                 an unannotated emotion text. The previous works usually
                 extract the emotion-cause pairs from two perspectives
                 of emotion and cause. However, emotion \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Reza Mohsenipour and Daniel Massicotte and Wei-Ping
                 Zhu",
  title =        "{PI} Control of Loudspeakers Based on Linear
                 Fractional Order Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1153--1162",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper aims at the proportional-integral (PI)
                 control of the cone vibration of the electrodynamic
                 loudspeakers system recently described using a linear
                 fractional order model. After introducing the
                 fractional order model of the circuit of these
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tim L{\"u}beck and Johannes M. Arend and Christoph
                 P{\"o}rschmann",
  title =        "Spatial Upsampling of Sparse Spherical Microphone
                 Array Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1163--1174",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "We present a method for spatial upsampling of signals
                 captured with spherical microphone arrays with a
                 limited number of microphones. The upsampling is
                 performed by adding virtual microphone signals using
                 interpolation between the measured array signals.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiajun Deng and Xurong Xie and Tianzi Wang and Mingyu
                 Cui and Boyang Xue and Zengrui Jin and Guinan Li and
                 Shujie Hu and Xunying Liu",
  title =        "Confidence Score Based Speaker Adaptation of Conformer
                 Speech Recognition Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1175--1190",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Speaker adaptation techniques provide a powerful
                 solution to customise automatic speech recognition
                 (ASR) systems for individual users. Practical
                 application of unsupervised model-based speaker
                 adaptation techniques to data intensive end-to-end ASR
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hongsheng Zhang and Jizhang Gan and Ting Liu and Kui
                 Huang and Hong Yang",
  title =        "Coefficients-Switched Normalized Least-Mean-Squares
                 Adaption in Echo Canceler of Sparse-Echo-Path",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1191--1199",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The Normalized Least-Mean-Squares (NLMS) algorithm
                 commonly used in echo cancelers suffers from a number
                 of limitations due to the existing sparsity in the echo
                 path. Although some sparsity-aware algorithms have been
                 proposed, the high computational \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Eric Guizzo and Tillman Weyde and Simone Scardapane
                 and Danilo Comminiello",
  title =        "Learning Speech Emotion Representations in the
                 Quaternion Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1200--1212",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "The modeling of human emotion expression in speech
                 signals is an important, yet challenging task. The high
                 resource demand of speech emotion recognition models,
                 combined with the general scarcity of emotion-labelled
                 data are obstacles to the development \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiaqi Bai and Ze Yang and Jian Yang and Hongcheng Guo
                 and Zhoujun Li",
  title =        "{KINet}: Incorporating Relevant Facts Into
                 Knowledge-Grounded Dialog Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1213--1222",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "Knowledge-grounded conversation has led to great
                 progress in producing informative dialog responses by
                 leveraging external knowledge. This work focuses on two
                 affiliated knowledge grounded conversation tasks:
                 \emph{Knowledge Selection} and \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Haiquan Zhao and Yuan Gao and Yingying Zhu",
  title =        "Robust Subband Adaptive Filter Algorithms-Based
                 Mixture Correntropy and Application to Acoustic Echo
                 Cancellation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1223--1233",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed May 17 14:29:03 MDT 2023",
  bibsource =    "",
  URL =          "",
  abstract =     "To acquire an improvement of the performance of the
                 subband adaptive filter with impulsive interference,
                 the normalized subband adaptive filter (NSAF)
                 algorithm-based maximum correntropy criterion (MCC),
                 called MCC-NSAF, has been developed. However, it is
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chen Zhang and Luis Fernando D'Haro and Qiquan Zhang
                 and Thomas Friedrichs and Haizhou Li",
  title =        "{PoE}: a Panel of Experts for Generalized Automatic
                 Dialogue Assessment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1234--1250",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Chatbots are expected to be knowledgeable across
                 multiple domains, e.g. for daily chit-chat, exchange of
                 information, and grounding in emotional situations. To
                 effectively measure the quality of such conversational
                 agents, a model-based automatic dialogue \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qing Wang and Jun Du and Hua-Xin Wu and Jia Pan and
                 Feng Ma and Chin-Hui Lee",
  title =        "A Four-Stage Data Augmentation Approach to
                 {ResNet-Conformer} Based Acoustic Modeling for Sound
                 Event Localization and Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1251--1264",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we propose a novel four-stage data
                 augmentation approach to ResNet-Conformer based
                 acoustic modeling for sound event localization and
                 detection (SELD). First, we explore two spatial
                 augmentation techniques, namely audio channel swapping
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yingwen Fu and Nankai Lin and Xiaohui Yu and Shengyi
                 Jiang",
  title =        "Self-Training With Double Selectors for Low-Resource
                 Named Entity Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1265--1275",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Named Entity Recognition (NER) is fundamental to
                 multiple downstream natural language processing (NLP)
                 tasks, but most advanced NER methods heavily rely on
                 massive labeled data with high cost. In this paper, we
                 explore the effectiveness of self-training \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kilian Schulze-Forster and Ga{\"e}l Richard and Liam
                 Kelley and Clement S. J. Doire and Roland Badeau",
  title =        "Unsupervised Music Source Separation Using
                 Differentiable Parametric Source Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1276--1289",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Supervised deep learning approaches to underdetermined
                 audio source separation achieve state-of-the-art
                 performance but require a dataset of mixtures along
                 with their corresponding isolated source signals. Such
                 datasets can be extremely costly to obtain \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yinggang Liu and Hong Fu and Ying Wei and Hanbing
  title =        "Sound Event Classification Based on Frequency-Energy
                 Feature Representation and Two-Stage Data Dimension
                 Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1290--1304",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The classification of environmental sound events is of
                 great significance for applications such as machine
                 hearing and acoustic surveillance. Feature
                 representation and feature vector dimension directly
                 affect system performance. To better extract \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ege Erdem and Zoran Cvetkovi{\'c} and H{\"u}seyin
                 Hac{\i}habibo{\u{g}}lu",
  title =        "{$3$D} Perceptual Soundfield Reconstruction via
                 Virtual Microphone Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1305--1317",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Perceptual soundfield reconstruction (PSR) is a
                 multichannel audio recording and reproduction framework
                 based on time-intensity panning in the horizontal
                 plane. A practical limitation of PSR is that the
                 optimal directivity patterns required by the system
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dongyuan Shi and Woon-Seng Gan and Bhan Lam and Xiaoyi
                 Shen",
  title =        "A Frequency-Domain Output-Constrained Active Noise
                 Control Algorithm Based on an Intuitive Circulant
                 Convolutional Penalty Factor",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1318--1332",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Due to their computational efficiency, least mean
                 square (LMS)-based algorithms are still widely utilized
                 to achieve optimal control in active noise control
                 (ANC) applications. Real-world implementation of
                 advanced ANC functionalities, such as \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Muhammed Zahid Ozturk and Chenshu Wu and Beibei Wang
                 and Min Wu and K. J. Ray Liu",
  title =        "{RadioSES}: {mmWave}-Based Audioradio Speech
                 Enhancement and Separation System",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1333--1347",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech enhancement and separation have been a
                 long-standing problem, especially with the recent
                 advances using a single microphone. Although
                 microphones perform well in constrained settings, their
                 performance for speech separation decreases in noisy
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jianwei Zhang and Julie Liss and Suren Jayasuriya and
                 Visar Berisha",
  title =        "Robust Vocal Quality Feature Embeddings for Dysphonic
                 Voice Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1348--1359",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Approximately 1.2\% of the world's population has
                 impaired voice production. As a result, automatic
                 dysphonic voice detection has attracted considerable
                 academic and clinical interest. However, existing
                 methods for automated voice assessment \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ashutosh Pandey and DeLiang Wang",
  title =        "Attentive Training: a New Training Framework for
                 Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1360--1370",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Dealing with speech interference in a speech
                 enhancement system requires either speaker separation
                 or target speaker extraction. Speaker separation has
                 multiple output streams with arbitrary assignments
                 while target speaker extraction requires additional
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hirofumi Inaguma and Tatsuya Kawahara",
  title =        "Alignment Knowledge Distillation for Online Streaming
                 Attention-Based Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1371--1385",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This article describes an efficient training method
                 for online streaming attention-based encoder-decoder
                 (AED) automatic speech recognition (ASR) systems. AED
                 models have achieved competitive performance in offline
                 scenarios by jointly optimizing all \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mittapalle Kiran Reddy and Paavo Alku",
  title =        "Exemplar-Based Sparse Representations for Detection of
                 {Parkinson}'s Disease From Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1386--1396",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Parkinson's disease (PD) is a progressive neurological
                 disorder which affects the motor system. The automatic
                 detection of PD improves the diagnosis of the disease,
                 and it can be done in a non-invasive manner from
                 speech. In this paper, we \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shunsuke Kita and Yoshinobu Kajikawa",
  title =        "Sound Source Localization Inside a Structure Under
                 Semi-Supervised Conditions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1397--1408",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "We propose a method for applying a sound source
                 localization (SSL) model trained on simulated data in a
                 real-world environment, with a domain transfer (DT)
                 model for the SSL inside a structure. The DT model
                 transfers real data into pseudo-simulation data.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guowei Wu and Shipei Liu and Xiaoya Fan",
  title =        "The Power of Fragmentation: a Hierarchical Transformer
                 Model for Structural Segmentation in Symbolic Music
                 Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1409--1420",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Symbolic music generation relies on the contextual
                 representation capabilities of the generative model,
                 where the most prevalent approach is the
                 Transformer-based model. Learning contextual
                 representations are also related to the structural
                 elements in \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xueqin Luo and Gongping Huang and Jilu Jin and
                 Jingdong Chen and Jacob Benesty and Wen Zhang and
                 Mengyao Zhu and Chunjian Li",
  title =        "Design of Maximum Directivity Beamformers With Linear
                 Acoustic Vector Sensor Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1421--1435",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper studies the design of maximum directivity
                 factor (MDF) beamformers based on uniform linear arrays
                 (ULAs) consisting of acoustic vector sensors (AVSs). We
                 first derive the main lobe constraints, which ensure
                 that the beamformer's \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ruchao Fan and Wei Chu and Peng Chang and Abeer
                 Alwan",
  title =        "A {CTC} Alignment-Based Non-Autoregressive Transformer
                 for End-to-End Automatic Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1436--1448",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Recently, end-to-end models have been widely used in
                 automatic speech recognition (ASR) systems. Two of the
                 most representative approaches are connectionist
                 temporal classification (CTC) and attention-based
                 encoder-decoder (AED) models. Autoregressive \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tianyou Li and Siyuan Lian and Sipei Zhao and Jing Lu
                 and Ian S. Burnett",
  title =        "Distributed Active Noise Control Based on an Augmented
                 Diffusion {FxLMS} Algorithm",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1449--1463",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Multichannel active noise control (ANC) systems have
                 been widely investigated for low-frequency noise
                 attenuation over a spatial region. Using a conventional
                 centralized control strategy based on the multichannel
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiayuan Xie and Wenhao Fang and Qingbao Huang and Yi
                 Cai and Tao Wang",
  title =        "Enhancing Paraphrase Question Generation With Prior
                 Knowledge",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1464--1475",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Paraphrase question generation (PQG) aims to rewrite a
                 given original question to a new paraphrase question,
                 where the paraphrase question needs to have the same
                 expressed meaning as the original question, but have a
                 difference in expression form. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chen Chen and Hansheng Hong and Jie Guo and Bin Song",
  title =        "Inter-Intra Modal Representation Augmentation With
                 Trimodal Collaborative Disentanglement Network for
                 Multimodal Sentiment Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1476--1488",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Recently, Multimodal Sentiment Analysis (MSA) is a
                 challenging research area given its complex nature, and
                 humans express emotional cues across various modalities
                 such as language, facial expressions, and speech.
                 Representation and fusion of features are \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jian Yang and Yuwei Yin and Liqun Yang and Shuming Ma
                 and Haoyang Huang and Dongdong Zhang and Furu Wei and
                 Zhoujun Li",
  title =        "{GTrans}: Grouping and Fusing Transformer Layers for
                 Neural Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1489--1498",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Transformer structure, stacked by a sequence of
                 encoder and decoder network layers, achieves
                 significant development in neural machine translation.
                 However, vanilla Transformer mainly exploits the
                 top-layer representation, assuming the lower layers
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xin Wu and Yi Cai and Zetao Lian and Ho-fung Leung and
                 Tao Wang",
  title =        "Generating Natural Language From Logic Expressions
                 With Structural Representation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1499--1510",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Incorporating logic reasoning with deep neural
                 networks (DNNs) is an important challenge in machine
                 learning. In this article, we study the problem of
                 converting logical expressions into natural language.
                 In particular, given a sequential logic expression,
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi Li and Yang Sun and Wenwu Wang and Syed Mohsen
                 Naqvi",
  title =        "U-Shaped Transformer With Frequency-Band Aware
                 Attention for Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1511--1521",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Recently, Transformer shows the potential to exploit
                 the long-range sequence dependency in speech with
                 self-attention. It has been introduced in single
                 channel speech enhancement to improve the accuracy of
                 speech estimation from a noise mixture. However,
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Christian Anto{\~n}anzas and Miguel Ferrer and Maria
                 de Diego and Alberto Gonzalez",
  title =        "Remote Microphone Technique for Active Noise Control
                 Over Distributed Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1522--1535",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Multichannel Active Noise Control (ANC) headrest
                 systems have usually been designed with the objective
                 of creating quiet areas at the passenger positions
                 within the cabin of a public transport. Due to the high
                 computational demands of dealing with \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi Zhu and Abhishek Tiwari and Jo{\~a}o Monteiro and
                 Shruti Kshirsagar and Tiago Henrique Falk",
  title =        "{COVID-19} Detection via Fusion of Modulation Spectrum
                 and Linear Prediction Speech Features",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1536--1549",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The coronavirus disease 2019 (COVID-19) pandemic has
                 drastically impacted life around the globe. As life
                 returns to pre-pandemic routines, COVID-19 testing has
                 become a key component, assuring that travellers and
                 citizens are free from the disease. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jijie Li and Kai Shuang and Jinyu Guo and Zengyi Shi
                 and Hongman Wang",
  title =        "Enhancing Semantic Relation Classification With
                 Shortest Dependency Path Reasoning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1550--1560",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Relation Classification (RC) is a basic and essential
                 task of Natural Language Processing. Existing RC
                 methods can be classified into two categories:
                 sequence-based methods and dependency-based methods.
                 Sequence-based methods identify the target relation
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mao-Kui He and Jun Du and Qing-Feng Liu and Chin-Hui
                 Lee",
  title =        "{ANSD-MA-MSE}: Adaptive Neural Speaker Diarization
                 Using Memory-Aware Multi-Speaker Embedding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1561--1573",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we propose a neural speaker diarization
                 (NSD) network architecture consisting of three key
                 components. First, a memory-aware multi-speaker
                 embedding (MA-MSE) mechanism is proposed to facilitate
                 a dynamical refinement of speaker embedding to
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Longting Xu and Jichen Yang and Chang Huai You and
                 Xinyuan Qian and Daiyu Huang",
  title =        "Device Features Based on Linear Transformation With
                 Parallel Training Data for Replay Speech Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1574--1586",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Replay speech poses a growing threat to speaker
                 verification systems, thus the detection of replay
                 speech becomes increasingly important. A critical
                 factor differentiating replay speech and genuine speech
                 is the representation of device information. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Huajian Fang and Dennis Becker and Stefan Wermter and
                 Timo Gerkmann",
  title =        "Integrating Uncertainty Into Neural Network-Based
                 Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1587--1600",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Supervised masking approaches in the time-frequency
                 domain aim to employ deep neural networks to estimate a
                 multiplicative mask to extract clean speech. This leads
                 to a single estimate for each input without any
                 guarantees or measures of reliability. In \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Libo Qin and Xiao Xu and Lehan Wang and Yue Zhang and
                 Wanxiang Che",
  title =        "Modularized Pre-Training for End-to-End Task-Oriented
                 Dialogue",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1601--1610",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hanlei Zhang and Hua Xu and Shaojie Zhao and Qianrui
                 Zhou",
  title =        "Learning Discriminative Representations and Decision
                 Boundaries for Open Intent Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1611--1623",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Open intent detection is a significant problem in
                 natural language understanding, which aims to identify
                 the unseen open intent while ensuring known intent
                 identification performance. However, current methods
                 face two major challenges. Firstly, they \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guangsheng Bao and Yue Zhang",
  title =        "A General Contextualized Rewriting Framework for Text
                 Summarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1624--1635",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The rewriting method for text summarization combines
                 the advantage of extractive and abstractive approaches,
                 improving the conciseness and readability of extractive
                 summaries. Exiting rewriting systems take extractive
                 sentences as the only input and \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Christoph Kirsch and Stephan D. Ewert",
  title =        "A Universal Filter Approximation of Edge Diffraction
                 for Geometrical Acoustics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1636--1651",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Sound propagation in urban and indoor environments
                 often involves diffraction at corners, finite objects
                 and openings, resulting in perceptually relevant
                 frequency-dependent attenuation. Geometrical acoustics
                 (GA) has become a de-facto standard for the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Peyman Goli and Steven van de Par",
  title =        "Deep Learning-Based Speech Specific Source
                 Localization by Using Binaural and Monaural Microphone
                 Arrays in Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1652--1666",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "A deep learning-based method is proposed for jointly
                 detecting and localizing speech sources in a complex
                 acoustic scene by using microphones of a hearing aid.
                 Motivated by the human auditory system, peripheral
                 preprocessing is applied on the microphone \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Nguyen Binh Thien and Yukoh Wakabayashi and Kenta Iwai
                 and Takanobu Nishiura",
  title =        "Inter-Frequency Phase Difference for Phase
                 Reconstruction Using Deep Neural Networks and Maximum
                 Likelihood",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1667--1680",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper presents improvements to two-stage
                 algorithms for estimating the short-time Fourier
                 transform (STFT) phase from only the amplitude by using
                 deep neural networks (DNNs). The phase is difficult to
                 reconstruct due to its sensitivity to the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Srikanth Raj Chetupalli and Emanu{\"e}l A. P. Habets",
  title =        "Speaker Counting and Separation From Single-Channel
                 Noisy Mixtures",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1681--1692",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "We address the problem of speaker counting and
                 separation from a noisy, single-channel, multi-source,
                 recording. Most of the works in the literature assume
                 mixtures containing two to five speakers. In this work,
                 we consider noisy speech mixtures with one \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guangyan Zhang and Ying Qin and Wenjie Zhang and
                 Jialun Wu and Mei Li and Yutao Gai and Feijun Jiang and
                 Tan Lee",
  title =        "{iEmoTTS}: Toward Robust Cross-Speaker Emotion
                 Transfer and Control for Speech Synthesis Based on
                 Disentanglement Between Prosody and Timbre",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1693--1705",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Cross-speaker emotion transfer is a common approach
                 to generating emotional speech when speech data with
                 emotion labels from target speakers is not available.
                 This paper presents a novel cross-speaker emotion
                 transfer system named iEmoTTS. The system is \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ruijie Tao and Kong Aik Lee and Rohan Kumar Das and
                 Ville Hautam{\"a}ki and Haizhou Li",
  title =        "Self-Supervised Training of Speaker Encoder With
                 Multi-Modal Diverse Positive Pairs",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1706--1719",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "We study a novel neural speaker encoder and its
                 training strategies for speaker recognition without
                 using any identity labels. The speaker encoder is
                 trained to extract a fixed dimensional speaker
                 embedding from a spoken utterance of variable length.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dongchao Yang and Jianwei Yu and Helin Wang and Wen
                 Wang and Chao Weng and Yuexian Zou and Dong Yu",
  title =        "Diffsound: Discrete Diffusion Model for Text-to-Sound
                 Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1720--1733",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Generating sound effects that people want is an
                 important topic. However, there are limited studies in
                 this area for sound generation. In this study, we
                 investigate generating sound conditioned on a text
                 prompt and propose a novel text-to-sound generation
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Paul Konstantin Krug and Peter Birkholz and Branislav
                 Gerazov and Daniel Rudolph van Niekerk and Anqi Xu and
                 Yi Xu",
  title =        "Artificial Vocal Learning Guided by Phoneme
                 Recognition and Visual Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1734--1744",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper introduces a paradigm shift regarding vocal
                 learning simulations, in which the communicative
                 function of speech acquisition determines the learning
                 process and intelligibility is considered the primary
                 measure of learning success. Thereby, a \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qian-Bei Hong and Chung-Hsien Wu and Hsin-Min Wang",
  title =        "Decomposition and Reorganization of Phonetic
                 Information for Speaker Embedding Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1745--1757",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech content is closely related to the stability of
                 speaker embeddings in speaker verification tasks. In
                 this paper, we propose a novel architecture based on
                 self-constraint learning (SCL) and reconstruction task
                 (RT) to remove the influence of phonetic \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wenbin Jiang and Kai Yu",
  title =        "Speech Enhancement With Integration of Neural
                 Homomorphic Synthesis and Spectral Masking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1758--1770",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech enhancement refers to suppressing the
                 background noise to improve the perceptual quality and
                 intelligibility of the observed noisy speech. Recently,
                 speech enhancement algorithms based on deep neural
                 networks (DNNs) have replaced traditional \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shu'ang Li and Xuming Hu and Li Lin and Aiwei Liu and
                 Lijie Wen and Philip S. Yu",
  title =        "A Multi-Level Supervised Contrastive Learning
                 Framework for Low-Resource Natural Language Inference",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1771--1783",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Natural Language Inference (NLI) is a growingly
                 essential task in natural language understanding, which
                 requires inferring the relationship between the
                 sentence pairs \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaoqing Zheng",
  title =        "Building Conventional {``Experts''} With a Dialogue
                 Logic Programming Language",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1784--1796",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "We describe DiaProlog, a dialogue logic programming
                 language that extends the vanilla Prolog with the
                 features to facilitate the integration of reasoning
                 capabilities into task-oriented dialogue systems. The
                 extended language combines the expressive power
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Haitao Lin and Junnan Zhu and Lu Xiang and Feifei Zhai
                 and Yu Zhou and Jiajun Zhang and Chengqing Zong",
  title =        "Topic-Oriented Dialogue Summarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1797--1810",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "A multi-turn dialogue often contains multiple
                 discussion topics. In several scenarios (e.g., customer
                 service dispute, public opinion monitoring), people are
                 only interested in the gist of a specific topic in the
                 dialogue. Therefore, we propose a novel \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Haohan Guo and Fenglong Xie and Xixin Wu and Frank K.
                 Soong and Helen Meng",
  title =        "{MSMC-TTS}: Multi-Stage Multi-Codebook {VQ-VAE} Based
                 Neural {TTS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1811--1824",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This article aims to improve neural TTS with
                 vector-quantized, compact speech representations. We
                 propose a Vector-Quantized Variational AutoEncoder
                 (VQ-VAE) based feature analyzer to encode acoustic
                 features into sequences with different time
                 resolutions, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bei Liu and Zhengyang Chen and Yanmin Qian",
  title =        "Depth-First Neural Architecture With Attentive Feature
                 Fusion for Efficient Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1825--1838",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Deep speaker embedding learning based on neural
                 networks has become the predominant approach in speaker
                 verification (SV) currently. In prior studies,
                 researchers have investigated various network
                 architectures. However, rare works pay attention to the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ria Ghosh and John H. L. Hansen",
  title =        "Bilateral Cochlear Implant Processing of Coding
                 Strategies With {CCi-MOBILE}, an Open-Source Research
                 Platform",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1839--1850",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "While speech understanding for cochlear implant (CI)
                 users in quiet is relatively effective, listeners
                 experience difficulty in identification of speaker and
                 sound location. To assist for better residual hearing
                 abilities and speech intelligibility \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Aolong Zhou and Wen Zhang and Guojun Xu and Xiaoyong
                 Li and Kefeng Deng and Junqiang Song",
  title =        "{DBSA-Net}: Dual Branch Self-Attention Network for
                 Underwater Acoustic Signal Denoising",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1851--1865",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Underwater acoustic signal denoising is a challenging
                 task due to the complexity of the underwater
                 environment. Most of the existing methods cannot
                 effectively cope with the problem of underwater
                 acoustic signal (UWAS) denoising at low signal-to-noise
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Weiwei Lin and Man-Wai Mak",
  title =        "Model-Agnostic Meta-Learning for Fast Text-Dependent
                 Speaker Embedding Adaptation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1866--1876",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "By constraining the lexical content of input speech,
                 text-dependent speaker verification (TD-SV) offers more
                 reliable performance than text-independent speaker
                 verification (TI-SV) when dealing with short
                 utterances. Because speech with constrained \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Andrea Galassi and Marco Lippi and Paolo Torroni",
  title =        "Multi-Task Attentive Residual Networks for Argument
                 Mining",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1877--1892",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "We explore the use of residual networks and neural
                 attention for multiple argument mining tasks. We
                 propose a residual architecture that exploits
                 attention, multi-task learning, and makes use of
                 ensemble, without any assumption on document or
                 argument \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi Luo and Jianwei Yu",
  title =        "Music Source Separation With Band-Split {RNN}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1893--1901",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The performance of music source separation (MSS)
                 models has been greatly improved in recent years thanks
                 to the development of novel neural network
                 architectures and training pipelines. However, recent
                 model designs for MSS were mainly motivated by other
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Keisuke Matsubara and Takuma Okamoto and Ryoichi
                 Takashima and Tetsuya Takiguchi and Tomoki Toda and
                 Hisashi Kawai",
  title =        "Harmonic-Net: Fundamental Frequency and Speech Rate
                 Controllable Fast Neural Vocoder",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1902--1915",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "There is a need to improve the synthesis quality of
                 HiFi-GAN-based real-time neural speech waveform
                 generative models on CPUs while preserving the
                 controllability of fundamental frequency \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi Zhou and Zhizheng Wu and Xiaohai Tian and Haizhou
                 Li",
  title =        "Optimization of Cross-Lingual Voice Conversion With
                 Linguistics Losses to Reduce Foreign Accents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1916--1926",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Cross-lingual voice conversion (XVC) transforms the
                 speaker identity of a source speaker to that of a
                 target speaker who speaks a different language. Due to
                 the intrinsic differences between languages, the
                 converted speech may carry an unwanted foreign
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qiu-Shi Zhu and Jie Zhang and Zi-Qiang Zhang and
                 Li-Rong Dai",
  title =        "A Joint Speech Enhancement and Self-Supervised
                 Representation Learning Framework for Noise-Robust
                 Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1927--1939",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Though speech enhancement (SE) can be used to improve
                 speech quality in noisy environments, it may also cause
                 distortions that degrade the performance of automatic
                 speech recognition (ASR) models. Self-supervised
                 pre-training, on the other hand, has been \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Siqi Sun and Korin Richmond and Hao Tang",
  title =        "Improving {Seq2Seq} {TTS} Frontends With Transcribed
                 Speech Audio",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1940--1952",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Due to the data inefficiency and low speech quality of
                 grapheme-based end-to-end text-to-speech (TTS), having
                 a separate high-performance TTS linguistic frontend is
                 still commonly regarded as necessary. However, a TTS
                 frontend is itself difficult to build \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shih-Lun Wu and Yi-Hsuan Yang",
  title =        "{MuseMorphose}: Full-Song and Fine-Grained Piano Music
                 Style Transfer With One Transformer {VAE}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1953--1967",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Transformers and variational autoencoders (VAE) have
                 been extensively employed for symbolic (e.g., MIDI)
                 domain music generation. While the former boast an
                 impressive capability in modeling long sequences, the
                 latter allow users to willingly exert control
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaoxue Gao and Chitralekha Gupta and Haizhou Li",
  title =        "{PoLyScriber}: Integrated Fine-Tuning of Extractor and
                 Lyrics Transcriber for Polyphonic Music",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1968--1981",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Lyrics transcription of polyphonic music is
                 challenging as the background music affects lyrics
                 intelligibility. Typically, lyrics transcription can be
                 performed by a two-step pipeline, i.e. a singing vocal
                 extraction front end, followed by a lyrics \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhicheng Lian and Haonan Cheng and Jiawan Zhang",
  title =        "{PQG-A2SA}: Performance Quantification Guided
                 Audio-to-Score Alignment for Orchestral Music",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1982--1992",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Audio-to-score alignment is a multi-modal task that
                 aims at generating an accurate mapping between symbolic
                 and signal-level representations of musical signals,
                 which is important for music performance analysis and
                 retrieval. Among numerous music genres, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jingen Ni and Ningning Zhang and Haofen Li",
  title =        "Sparsity-Promoting Affine Projection Algorithm With
                 Periodically-Updated Gain Matrix and Its Performance
                 Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "1993--2003",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Sparse system identification is often encountered in
                 applications such as network and acoustic echo
                 cancellation. This work applies the sparsity promoting
                 method to the affine projection algorithm (APA) to
                 develop a sparsity-promoting APA (SAPA). To \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Orchisama Das and Sebastian J. Schlecht and Enzo {De
                 Sena}",
  title =        "Grouped Feedback Delay Networks With
                 Frequency-Dependent Coupling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2004--2015",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Feedback Delay Networks are one of the most popular
                 and efficient means of generating artificial
                 reverberation. Recently, we proposed the Grouped
                 Feedback Delay Network (GFDN), which couples multiple
                 FDNs while maintaining system stability. The GFDN can
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xudong Zhao and Gongping Huang and Jingdong Chen and
                 Jacob Benesty",
  title =        "Design of {$2$D} and {$3$D} Differential Microphone
                 Arrays With a Multistage Framework",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2016--2031",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Differential microphone arrays (DMAs) have
                 demonstrated a great potential for high-fidelity
                 acoustic and speech signal acquisition in a wide range
                 of applications since such arrays are able to achieve
                 frequency-invariant beampatterns with high \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jia-Hao Hsu and Jeremy Chang and Min-Hsueh Kuo and
                 Chung-Hsien Wu",
  title =        "Empathetic Response Generation Based on Plug-and-Play
                 Mechanism With Empathy Perturbation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2032--2042",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Spoken dialogue systems have rapidly developed but are
                 often viewed as inhumane because they lack empathetic
                 communication skills. In this study, a
                 transformer-based language model (DialoGPT fine-tuned
                 on the EmpatheticDialogues dataset) was combined with
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Aditya Dutt and Paul Gader",
  title =        "Wavelet Multiresolution Analysis Based Speech Emotion
                 Recognition System Using {$1$D} {CNN LSTM} Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2043--2054",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech Emotion Recognition (SER) is the task of
                 recognizing a speaker's emotional state from speech.
                 SER plays a significant role in Human-Computer
                 Interaction and psychological assessment. Several kinds
                 of time-frequency representations like \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Arturo Morales and Juan I. Yuz and Juan P. Cort{\'e}s
                 and Javier G. Fontanet and Mat{\'\i}as Za{\~n}artu",
  title =        "Glottal Airflow Estimation Using Neck Surface
                 Acceleration and Low-Order {Kalman} Smoothing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2055--2066",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The use of non-invasive skin accelerometers placed
                 over the extrathoracic trachea has been proposed in the
                 literature for measuring vocal function. Glottal
                 airflow is estimated using inverse filtering or
                 Bayesian techniques based on a subglottal impedance-based
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuya Hosoda and Arata Kawamura and Youji Iiguni",
  title =        "Complex-Domain Pitch Estimation Algorithm for
                 Narrowband Speech Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2067--2078",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "We propose a complex-domain pitch estimation algorithm
                 for narrowband speech signals, which utilizes a complex
                 spectrum containing both amplitude and phase spectrum
                 information. Traditional frequency-domain pitch
                 estimation algorithms assume that a speech \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhidong Liu and Junhui Li and Muhua Zhu",
  title =        "Alleviating Exposure Bias for Neural Machine
                 Translation via Contextual Augmentation and Self
                 Distillation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2079--2089",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In neural machine translation (NMT), most
                 sequence-to-sequence (seq2seq) models are trained only
                 with the teacher-forcing paradigm, where the ground
                 truth history is used to predict the next ground truth
                 word. At the inference stage, however, the decoder
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hanan Beit-On and Tom Shlomo and Boaz Rafaely",
  title =        "Weighted Frequency Smoothing for Enhanced Speaker
                 Localization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2090--2099",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The coherent signal subspace method may be used in
                 order to apply subspace localization methods (e.g.
                 MUSIC) to coherent sources. This method involves a
                 focusing process followed by frequency smoothing, which
                 is intended to decorrelate source signals from
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shan Gao and Xihong Wu and Tianshu Qu",
  title =        "A Physical Model-Based Self-Supervised Learning Method
                 for Signal Enhancement Under Reverberant Environment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2100--2110",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In a reverberant environment, interferences such as
                 reflections and background noise can degrade the
                 perception of the sound source signal. Although the
                 DNN-based methods have made a tremendous breakthrough
                 in addressing this issue, the performance of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xue Jiang and Xiulian Peng and Huaying Xue and Yuan
                 Zhang and Yan Lu",
  title =        "Latent-Domain Predictive Neural Speech Coding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2111--2123",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Neural audio/speech coding has recently demonstrated
                 its capability to deliver high quality at much lower
                 bitrates than traditional methods. However, existing
                 neural audio/speech codecs employ either acoustic
                 features or learned blind features with a \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shumin Deng and Jiacheng Yang and Hongbin Ye and
                 Chuanqi Tan and Mosha Chen and Songfang Huang and Fei
                 Huang and Huajun Chen and Ningyu Zhang",
  title =        "{LOGEN}: Few-Shot Logical Knowledge-Conditioned Text
                 Generation With Self-Training",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2124--2133",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Natural language generation from structured data
                 mainly focuses on surface-level descriptions, suffering
                 from uncontrollable content selection and low fidelity.
                 Previous works leverage logical forms to facilitate
                 logical knowledge-conditioned text \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuanzhi Liu and Min He and Qingqing Yang and Gwanggil
                 Jeon",
  title =        "An Unsupervised Framework With Attention Mechanism and
                 Embedding Perturbed Encoder for Non-Parallel Text
                 Sentiment Style Transfer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2134--2144",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Text sentiment style transfer aims to extract the
                 sentiment words from a sentence and transfer them into
                 another expected sentiment style while retaining the
                 original sentence's content. However, previous works
                 have not achieved satisfactory \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yang Ai and Zhen-Hua Ling",
  title =        "{APNet}: an All-Frame-Level Neural Vocoder
                 Incorporating Direct Prediction of Amplitude and Phase
                 Spectra",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2145--2157",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper presents a novel neural vocoder named APNet
                 which reconstructs speech waveforms from acoustic
                 features by predicting amplitude and phase spectra
                 directly. The APNet vocoder is composed of an amplitude
                 spectrum predictor (ASP) and a phase \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Fei Zhao and Zhen Wu and Liang He and Xin-Yu Dai",
  title =        "Label-Correction Capsule Network for Hierarchical Text
                 Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2158--2168",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Hierarchical Text Classification (HTC) aims to predict
                 the category of a document in a given label hierarchy.
                 Considering a parent-child relationship among labels at
                 different levels, previous works mainly leverage the
                 parent-level label information to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Cem Subakan and Mirco Ravanelli and Samuele Cornell
                 and Fran{\c{c}}ois Grondin and Mirko Bronzi",
  title =        "Exploring Self-Attention Mechanisms for Speech
                 Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2169--2180",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Transformers have enabled impressive improvements in
                 deep learning. They often outperform recurrent and
                 convolutional models in many tasks while taking
                 advantage of parallel processing. Recently, we proposed
                 the SepFormer, which obtains state-of-the-art
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chenggang Zhang and Jinjiang Liu and Hao Li and
                 Xueliang Zhang",
  title =        "Neural Multi-Channel and Multi-Microphone Acoustic
                 Echo Cancellation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2181--2192",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Deep learning is introduced in multi-channel (MC) and
                 multi-microphone (MM) acoustic echo cancellation (AEC)
                 without decorrelation to the loudspeaker signals and
                 achieves remarkable performance. In this article, we
                 propose a complex spectral mapping \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zheng Liu and Xin Kang and Fuji Ren",
  title =        "Dual-{TBNet}: Improving the Robustness of Speech
                 Features via Dual-Transformer-{BiLSTM} for Speech
                 Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2193--2203",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech emotion recognition has always been one of the
                 topics that have attracted a lot of attention from many
                 researchers. In traditional feature fusion methods, the
                 speech features used only come from the data set, and
                 the weak robustness of features can \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sandro Cumani and Salvatore Sarni",
  title =        "The Distributions of Uncalibrated Speaker Verification
                 Scores: a Generative Model for Domain Mismatch and
                 Trial-Dependent Calibration",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2204--2219",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speaker verification systems that compute
                 log-likelihood ratios (LLR) between the same and
                 different speaker hypotheses allow for cost-effective
                 decisions that depend only on prior information. Domain
                 mismatch, inaccurate model assumptions or the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xi Ai and Bin Fang",
  title =        "Cross-Modal Language Modeling in Multi-Motion-Informed
                 Context for Lip Reading",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2220--2232",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "We observe that for lip reading, the language is
                 locally transformed, instead of globally transformed,
                 i.e., speaking and writing follow the same basic
                 grammar rules. In this work, we present a cross-modal
                 language model to tackle the lip-reading \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Andreas Jonas Fuglsig and Jesper Jensen and Zheng-Hua
                 Tan and Lars S{\o}ndergaard Bertelsen and Jens
                 Christian Lindof and Jan {\O}stergaard",
  title =        "Minimum Processing Near-End Listening Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2233--2245",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The intelligibility and quality of speech from a
                 mobile phone or public announcement system are often
                 affected by background noise in the listening
                 environment. By pre-processing the speech signal it is
                 possible to improve the speech intelligibility and
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhiwen Xie and Runjie Zhu and Jin Liu and Guangyou
                 Zhou and Jimmy Xiangji Huang",
  title =        "{TARGAT}: a Time-Aware Relational Graph Attention
                 Model for Temporal Knowledge Graph Embedding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2246--2258",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Temporal knowledge graph embedding (TKGE) aims to
                 learn the embedding of entities and relations in a
                 temporal knowledge graph (TKG). Although the previous
                 graph neural networks (GNN) based models have achieved
                 promising results, they cannot directly \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Cuilian Zhang and Derek F. Wong and Eddy S. K. Lei and
                 Runzhe Zhan and Lidia S. Chao",
  title =        "Obscurity-Quantified Curriculum Learning for Machine
                 Translation Evaluation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2259--2271",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The pre-trained language model has been developed for
                 evaluating the quality of machine translation. It
                 achieves state-of-the-art results. However, building a
                 model for the evaluation of machine translation still
                 faces the following challenges: (1) large \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yaxin Liu and Yan Zhou and Ziming Li and Junlin Wang
                 and Wei Zhou and Songlin Hu",
  title =        "{HIM}: an End-to-End Hierarchical Interaction Model
                 for Aspect Sentiment Triplet Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2272--2285",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Aspect Sentiment Triplet Extraction (ASTE) is an
                 emerging task of fine-grained sentiment analysis, which
                 aims to extract aspect terms, associated opinion terms,
                 and sentiment polarities in the form of triplets. Thus,
                 ASTE involves two groups of subtasks: \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yukoh Wakabayashi and Kouei Yamaoka and Nobutaka Ono",
  title =        "Sound Field Interpolation for Rotation-Invariant
                 Multichannel Array Signal Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2286--2298",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we present a sound field interpolation
                 for array signal processing (ASP) that is robust to
                 rotation of a circular microphone array (CMA), and we
                 evaluate beamforming as one of its applications. Most
                 ASP methods assume a time-invariant \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jesper Kj{\ae}r Nielsen and Mads Gr{\ae}sb{\o}ll
                 Christensen and Jesper B{\"u}nsow Boldt",
  title =        "An Analysis of Traditional Noise Power Spectral
                 Density Estimators Based on the {Gaussian} Stochastic
                 Volatility Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2299--2313",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Many single- and multi-channel speech enhancement
                 techniques, old and new, rely in one way or another on
                 estimates of the noise power spectral density (PSD).
                 For example, the classical Wiener filter requires that
                 either the speech or noise PSD be \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Karen Gissell Rosero Jacome and Felipe Leonel Grijalva
                 and Bruno Sanches Masiero",
  title =        "Sound Events Localization and Detection Using
                 Bio-Inspired Gammatone Filters and Temporal
                 Convolutional Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2314--2324",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The auditory brain circuits are biologically
                 constructed to recognize and localize sounds by encoding a
                 combination of cues that help individuals interpret
                 sounds. The development of computational methods
                 inspired by human capacities has established \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lin Yuan and Guoheng Huang and Fenghuan Li and
                 Xiaochen Yuan and Chi-Man Pun and Guo Zhong",
  title =        "{RBA-GCN}: Relational Bilevel Aggregation Graph
                 Convolutional Network for Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2325--2337",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Emotion recognition in conversation (ERC) has received
                 increasing attention from researchers due to its wide
                 range of applications. As conversation has a natural
                 graph structure, numerous approaches used to model ERC
                 based on graph convolutional networks \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Samuel Poirot and Stefan Bilbao and Mitsuko Aramaki
                 and S{\o}lvi Ystad and Richard Kronland-Martinet",
  title =        "A Perceptually Evaluated Signal Model: Collisions
                 Between a Vibrating Object and an Obstacle",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2338--2350",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The collision interaction mechanism between a
                 vibrating string and a non-resonant obstacle is at the
                 heart of many musical instruments. This article focuses
                 on the identification of perceptually salient auditory
                 features related to this phenomenon. The \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Julius Richter and Simon Welker and Jean-Marie
                 Lemercier and Bunlong Lay and Timo Gerkmann",
  title =        "Speech Enhancement and Dereverberation With
                 Diffusion-Based Generative Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2351--2364",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this work, we build upon our previous publication
                 and use diffusion-based generative models for speech
                 enhancement. We present a detailed overview of the
                 diffusion process that is based on a stochastic
                 differential equation and delve into an extensive
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Siarhei Y. Barysenka and Vasili I. Vorobiov",
  title =        "{SNR}-Based Inter-Component Phase Estimation Using
                 Bi-Phase Prior Statistics for Single-Channel Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2365--2381",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The fundamental problem of phase-aware single-channel
                 speech enhancement is the estimation of the harmonic
                 phase of signal components from noisy observations. One
                 approach to obtain an estimate of the harmonic phase is
                 by smoothing the noisy harmonic \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiandian Zeng and Jiantao Zhou and Caishi Huang",
  title =        "Exploring Semantic Relations for Social Media
                 Sentiment Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2382--2394",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "With the massive social media data available online,
                 the conventional single modality emotion classification
                 has developed into more complex models of multimodal
                 sentiment analysis. Most existing works simply
                 extracted image features at a coarse level, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Fotios Drakopoulos and Sarah Verhulst",
  title =        "A Neural-Network Framework for the Design of
                 Individualised Hearing-Loss Compensation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2395--2409",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Sound processing in the human auditory system is
                 complex and highly non-linear, whereas hearing aids
                 (HAs) still rely on simplified descriptions of auditory
                 processing or hearing loss to restore hearing. Even
                 though standard HA amplification strategies \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xinbei Ma and Zhuosheng Zhang and Hai Zhao",
  title =        "Enhanced Speaker-Aware Multi-Party Multi-Turn Dialogue
                 Comprehension",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2410--2423",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Multi-party multi-turn dialogue comprehension brings
                 unprecedented challenges in handling complicated
                 scenarios, as the co-occurrence of multiple speakers
                 causes complexity and inconsistency. As a result of the
                 multiple participation, the shift of speaker \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tianrui Wang and Weibin Zhu and Yingying Gao and
                 Shilei Zhang and Junlan Feng",
  title =        "Harmonic Attention for Monaural Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2424--2436",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "To further improve the quality of the enhanced speech,
                 it is appealing that more profound articulatory and
                 auditory knowledge should be introduced into the speech
                 enhancement model. Among these, harmonics seriously
                 affect speech timbre and play a crucial \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lei Lei and Guoshun Yuan and Hongjiang Yu and Dewei
                 Kong and Yuefeng He",
  title =        "Multilingual Customized Keyword Spotting Using
                 Similar-Pair Contrastive Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2437--2447",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The goal of keyword spotting (KWS) is to find words
                 and voice commands. KWS research has received a lot of
                 attention recently. However, the majority of them
                 emphasize predefined KWS. More often than not,
                 customers wish to choose individualized unique
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shaokai Li and Peng Song and Wenming Zheng",
  title =        "Multi-Source Discriminant Subspace Alignment for
                 Cross-Domain Speech Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2448--2460",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Cross-domain speech emotion recognition (SER) is an
                 effective strategy to improve the generalization
                 ability of emotion classification models, which is an
                 important research direction in speech signal
                 processing. However, since the speech signals are
                 non-. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yeqing Ren and Haipeng Peng and Lixiang Li and
                 Xiaopeng Xue and Yang Lan and Yixian Yang",
  title =        "Generalized Voice Spoofing Detection via Integral
                 Knowledge Amalgamation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2461--2475",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Most of the voice spoofing detection methods are
                 designed for specific kinds of spoofing attacks,
                 synthetic or replay. In practice, however, there is no
                 prior information about these two kinds of spoofing
                 attacks. To this end, this paper proposes a \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xing Chen and Jie Wang and Xiao-Lei Zhang and
                 Wei-Qiang Zhang and Kunde Yang",
  title =        "{LMD}: a Learnable Mask Network to Detect Adversarial
                 Examples for Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2476--2490",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Although the security of automatic speaker
                 verification (ASV) is seriously threatened by recently
                 emerged adversarial attacks, there have been some
                 countermeasures to alleviate the threat. However, many
                 defense approaches not only require the prior
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Benjamin Yen and Yameizhen Li and Yusuke Hioka",
  title =        "Rotor Noise-Aware Noise Covariance Matrix Estimation
                 for Unmanned Aerial Vehicle Audition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2491--2506",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "A noise covariance matrix (NCM) estimation method for
                 unmanned aerial vehicle (UAV) audition is proposed with
                 rotor noise reduction as its primary focus. The
                 proposed NCM estimation method could be incorporated
                 into audio processing algorithms using UAV-. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xuechen Liu and Xin Wang and Md Sahidullah and Jose
                 Patino and H{\'e}ctor Delgado and Tomi Kinnunen and
                 Massimiliano Todisco and Junichi Yamagishi and Nicholas
                 Evans and Andreas Nautsch and Kong Aik Lee",
  title =        "{ASVspoof 2021}: Towards Spoofed and Deepfake Speech
                 Detection in the Wild",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2507--2522",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Benchmarking initiatives support the meaningful
                 comparison of competing solutions to prominent problems
                 in speech and language processing. Successive
                 benchmarking evaluations typically reflect a
                 progressive evolution from ideal lab conditions towards
                 to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zal{\'a}n Borsos and Rapha{\"e}l Marinier and Damien
                 Vincent and Eugene Kharitonov and Olivier Pietquin and
                 Matt Sharifi and Dominik Roblek and Olivier Teboul and
                 David Grangier and Marco Tagliasacchi and Neil
                 Zeghidour",
  title =        "{AudioLM}: a Language Modeling Approach to Audio
                 Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2523--2533",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "We introduce AudioLM, a framework for high-quality
                 audio generation with long-term consistency. AudioLM
                 maps the input audio to a sequence of discrete tokens
                 and casts audio generation as a language modeling task
                 in this representation space. We show how \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xingfeng Li and Xiaohan Shi and Desheng Hu and Yongwei
                 Li and Qingchen Zhang and Zhengxia Wang and Masashi
                 Unoki and Masato Akagi",
  title =        "Music Theory-Inspired Acoustic Representation for
                 Speech Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2534--2547",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This research presents a music theory-inspired
                 acoustic representation (hereafter, MTAR) to address
                 improved speech emotion recognition. The recognition of
                 emotion in speech and music is developed in parallel,
                 yet a relatively limited understanding of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiachen Lian and Chunlei Zhang and Gopala K.
                 Anumanchipalli and Dong Yu",
  title =        "Unsupervised {TTS} Acoustic Modeling for {TTS} With
                 Conditional Disentangled Sequential {VAE}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2548--2557",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we propose a novel unsupervised
                 text-to-speech acoustic model training scheme, named
                 UTTS, which does not require text-audio pairs. UTTS is
                 a multi-speaker speech synthesizer that supports
                 zero-shot voice cloning, it is developed from a
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Arsalan Malik and Nipun Agarwal and Harshavardhan
                 Settibhaktini and Ananthakrishna Chintanpalli",
  title =        "Predicting Level-Dependent Changes in Concurrent Vowel
                 Scores Using the {$2$D-CNN} Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2558--2566",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Differences in fundamental frequencies (F0s) are an
                 important cue for segregating multiple speakers.
                 However, the ability to avail this cue for
                 identification varies with sound levels. For
                 different-and same-F0 conditions, the identification
                 scores of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Michael Krause and Meinard M{\"u}ller",
  title =        "Hierarchical Classification for Instrument Activity
                 Detection in Orchestral Music Recordings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2567--2578",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Instrument activity detection is a fundamental task in
                 music information retrieval, serving as a basis for
                 many applications, such as music recommendation, music
                 tagging, or remixing. Most published works on this task
                 cover popular music and music for \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Julie Meyer and Sebastian Prepeli{\c{t}}{\u{a}} and
                 Ali Khajeh-Saeed and Michael Smirnov and Pablo
                 Hoffmann",
  title =        "Verification on Head-Related Transfer Functions of a
                 Snowman Model Simulated Using the Finite-Difference
                 Time-Domain Method",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2579--2591",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Although finite-difference time-domain (FDTD)
                 simulations are extensively used in acoustics, studies
                 assessing the reliability and the accuracy of the
                 implemented method are scarce. Moreover, the
                 operational validity of a simulation method is
                 context-. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Darius Petermann and Gordon Wichern and Aswin
                 Shanmugam Subramanian and Zhong-Qiu Wang and Jonathan
                 {Le Roux}",
  title =        "Tackling the Cocktail Fork Problem for Separation and
                 Transcription of Real-World Soundtracks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2592--2605",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Emulating the human ability to solve the cocktail
                 party problem, i.e., focus on a source of interest in a
                 complex acoustic scene, is a long standing goal of
                 audio source separation research. In this paper, we
                 focus on the cocktail fork problem, which \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hailong Cao and Liguo Li and Conghui Zhu and Muyun
                 Yang and Tiejun Zhao",
  title =        "Dual Word Embedding for Robust Unsupervised Bilingual
                 Lexicon Induction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2606--2615",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The word embedding models such as Word2vec and
                 FastText simultaneously learn dual representations of
                 input vectors and output vectors. In contrast, almost
                 all existing unsupervised bilingual lexicon induction
                 (UBLI) methods use only input vectors without
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lin Xiao and Pengyu Xu and Mingyang Song and Huafeng
                 Liu and Liping Jing and Xiangliang Zhang",
  title =        "Triple Alliance Prototype Orthotist Network for
                 Long-Tailed Multi-Label Text Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2616--2628",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Multi-label text classification (MLTC) aims to tag
                 the most relevant labels for the given document.
                 Compared to the standard multi-class case where each
                 document has only one label, it is considerably more
                 difficulty to annotate new coming documents for
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Juhua Liu and Qihuang Zhong and Liang Ding and Hua Jin
                 and Bo Du and Dacheng Tao",
  title =        "Unified Instance and Knowledge Alignment Pretraining
                 for Aspect-Based Sentiment Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2629--2642",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The goal of aspect-based sentiment analysis (ABSA) is
                 to determine the sentiment polarity towards an aspect.
                 Because of the expensive and limited amounts of
                 labelled data, the pretraining strategy has become the
                 de facto standard for ABSA. However, there \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yiming Zhang and Hong Yu and Ruoyi Du and Zheng-Hua
                 Tan and Wenwu Wang and Zhanyu Ma and Yuan Dong",
  title =        "{ACTUAL}: Audio Captioning With Caption Feature Space
                 Regularization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2643--2657",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Audio captioning aims at describing the content of
                 audio clips with human language. Due to the ambiguity
                 of audio content, different people may perceive the
                 same audio clip differently, resulting in caption
                 disparities \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jakob Abe{\ss}er and Sascha Grollmisch and Meinard
                 M{\"u}ller",
  title =        "How Robust are Audio Embeddings for Polyphonic Sound
                 Event Tagging?",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2658--2667",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Sound classification algorithms are challenged by the
                 natural variability of everyday sounds, particularly
                 for large sound class taxonomies. In order to be
                 applicable in real-life environments, such algorithms
                 must also be able to handle polyphonic \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wei Xia and John H. L. Hansen",
  title =        "Attention and {DCT} Based Global Context Modeling for
                 Text-Independent Speaker Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2668--2679",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Learning an effective speaker representation is
                 crucial for achieving reliable performance in speaker
                 verification tasks. Speech signals are
                 high-dimensional, long, and variable-length sequences
                 containing diverse information at each time-frequency
                 (TF) \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Takuya Hasumi and Tomohiko Nakamura and Norihiro
                 Takamune and Hiroshi Saruwatari and Daichi Kitamura and
                 Yu Takahashi and Kazunobu Kondo",
  title =        "{PoP-IDLMA}: Product-of-Prior Independent Deeply
                 Learned Matrix Analysis for Multichannel Music Source
                 Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2680--2694",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Independent deeply learned matrix analysis (IDLMA) is
                 a state-of-the-art determined audio source separation
                 method based on pretrained deep neural networks (DNNs).
                 Owing to the excellent expression power of DNNs, IDLMA
                 can handle a wider range of sources \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ben Liu and Jun Wang and Guanyuan Yu and Shaolei
  title =        "{CUPVC}: a Constraint-Based Unsupervised Prosody
                 Transfer for Improving Telephone Banking Services",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2695--2706",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Low efficiency in telephone banking services reduces
                 customer satisfaction. Therefore, some recent studies
                 have concentrated on applying voice conversion models
                 to improve telephone banking services. However,
                 building such a model raises three huge \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guinan Li and Jiajun Deng and Mengzhe Geng and Zengrui
                 Jin and Tianzi Wang and Shujie Hu and Mingyu Cui and
                 Helen Meng and Xunying Liu",
  title =        "Audio-Visual End-to-End Multi-Channel Speech
                 Separation, Dereverberation and Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2707--2723",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Accurate recognition of cocktail party speech
                 containing overlapping speakers, noise and
                 reverberation remains a highly challenging task to
                 date. Motivated by the invariance of visual modality to
                 acoustic signal corruption, an audio-visual
                 multi-channel \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jean-Marie Lemercier and Julius Richter and Simon
                 Welker and Timo Gerkmann",
  title =        "{StoRM}: a Diffusion-Based Stochastic Regeneration
                 Model for Speech Enhancement and Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2724--2737",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Diffusion models have shown a great ability at
                 bridging the performance gap between predictive and
                 generative approaches for speech enhancement. We have
                 shown that they may even outperform their predictive
                 counterparts for non-additive corruption types or
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yen-Ju Lu and Chia-Yu Chang and Cheng Yu and
                 Ching-Feng Liu and Jeih-weih Hung and Shinji Watanabe
                 and Yu Tsao",
  title =        "Improving Speech Enhancement Performance by Leveraging
                 Contextual Broad Phonetic Class Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2738--2750",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Previous studies have confirmed that by augmenting
                 acoustic features with the place/manner of articulatory
                 features, the speech enhancement (SE) process can be
                 guided to consider the broad phonetic properties of the
                 input speech when performing \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sungjae Kim and Yewon Kim and Jewoo Jun and Injung
                 Kim",
  title =        "{MuSE-SVS}: Multi-Singer Emotional Singing Voice
                 Synthesizer That Controls Emotional Intensity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2751--2764",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "We propose a multi-singer emotional singing voice
                 synthesizer, Muse-SVS, that expresses emotion at
                 various intensity levels by controlling subtle changes
                 in pitch, energy, and phoneme duration while accurately
                 following the score. To control multiple \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xinxin Su and Zhen Huang and Yunxiang Zhao and Yifan
                 Chen and Yong Dou and Hengyue Pan",
  title =        "Recent Trends in Deep Learning Based Textual Emotion
                 Cause Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2765--2786",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Emotion Cause Extraction Field (ECEF) focuses on the
                 cause that triggers an emotion in a document.
                 Traditional ECEF aims to extract the cause based on a
                 given emotion while recent ECEF focuses more on
                 extracting both the emotion and its corresponding
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Junyu Lu and Hongfei Lin and Xiaokun Zhang and
                 Zhaoqing Li and Tongyue Zhang and Linlin Zong and
                 Fenglong Ma and Bo Xu",
  title =        "Hate Speech Detection via Dual Contrastive Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2787--2795",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The fast spread of hate speech on social media impacts
                 the Internet environment and our society by increasing
                 prejudice and hurting people. Detecting hate speech has
                 aroused broad attention in the field of natural
                 language processing. Although hate speech \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Diego Marques do Carmo and Ricardo A. Borsoi and
                 M{\'a}rcio Holsbach Costa",
  title =        "Closed-Form Solution to the Multichannel {Wiener}
                 Filter With Interaural Level Difference Preservation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2796--2811",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This article presents a multichannel Wiener filter
                 (MWF) based noise reduction method with preservation of
                 the interaural level difference (ILD). It minimizes the
                 MWF cost function subject to two constraints for ILD
                 preservation. Under this approach, the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ya-Jie Zhang and Chao Zhang and Wei Song and Zhengchen
                 Zhang and Youzheng Wu and Xiaodong He",
  title =        "Prosody Modelling With Pre-Trained Cross-Utterance
                 Representations for Improved Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2812--2823",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "When humans speak multiple utterances in a continuous
                 manner, the prosodic features generated in each
                 utterance are related to those in its neighbouring
                 utterances. Such cross-utterance (CU) dependencies are
                 often ignored by the current neural text-to-.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ching-Yu Chiu and Meinard M{\"u}ller and Matthew E. P.
                 Davies and Alvin Wen-Yu Su and Yi-Hsuan Yang",
  title =        "Local Periodicity-Based Beat Tracking for Expressive
                 Classical Piano Music",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2824--2835",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "To model the periodicity of beats, state-of-the-art
                 beat tracking systems use ``post-processing trackers''
                 (PPTs) that rely on several empirically determined
                 global assumptions for tempo transition, which work
                 well for music with a steady \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Feng Chen and Ke Ma and Yapeng Mao and Desen Yang and
                 Yi Zhang and Jie Shi and Shiqi Mo and Gui Chenyang and
                 Song Li",
  title =        "A Novel Method to Design Steerable Differential
                 Beamformer Using Linear Acoustics Vector Sensor Array",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2836--2849",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Differential beamforming techniques have gained
                 significant attention due to their
                 frequency-independent beampatterns, applicability for
                 small apertures, and super-directivity. It is commonly
                 known that the main lobe of a beam pattern based on a
                 linear \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tianyu Huang and Weisheng Dong and Fangfang Wu and Xin
                 Li and Guangming Shi",
  title =        "Uncertainty-Driven Knowledge Distillation for Language
                 Model Compression",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2850--2858",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Despite the remarkable performance on various Natural
                 Language Processing (NLP) tasks, the parametric
                 complexity of pretrained language models has remained a
                 major obstacle due to limited computational resources
                 in many practical applications. Techniques \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Andr{\'e}s Carofilis and Enrique Alegre and Eduardo
                 Fidalgo and Laura Fern{\'a}ndez-Robles",
  title =        "Improvement of Accent Classification Models Through
                 Grad-Transfer From Spectrograms and Gradient-Weighted
                 Class Activation Mapping",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2859--2871",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatic accent classification is an active research
                 field concerning speech processing. It can be useful to
                 identify a speaker's region of origin, which can be
                 applied in police investigations carried out by Law
                 Enforcement Agencies, as well as \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jacob Hollebon and Filippo Maria Fazi",
  title =        "Higher-Order Stereophony",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2872--2885",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This work introduces a new theory for spatial audio
                 recording and reproduction named Higher Order
                 Stereophony. Through the use of the Taylor expansion,
                 the technique accurately reproduces a sound field
                 across a line that is orientated as the interaural
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jeremy H. M. Wong and Huayun Zhang and Nancy F. Chen",
  title =        "Modelling Inter-Rater Uncertainty in Spoken Language
                 Assessment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2886--2898",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In a subjective task, such as Spoken Language
                 Assessment (SLA), the reference scores provided by
                 different human raters may vary. A collection of
                 annotated scores from multiple raters can be
                 interpreted as an expression of data uncertainty.
                 Previous \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qinghua Zheng and Yuefei Wu and Guangtao Wang and
                 Yanping Chen and Wei Wu and Zai Zhang and Bin Shi and
                 Bo Dong",
  title =        "Exploring Interactive and Contrastive Relations for
                 Nested Named Entity Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2899--2909",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Nested named entities (nested NEs) refer to the
                 situation where one named entity is included or nested
                 within another named entity, which cannot be recognized
                 by the traditional sequence labeling methods. Recently,
                 span-based methods have become the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dongyuan Shi and Woon-Seng Gan and Bhan Lam and
                 Zhengding Luo and Xiaoyi Shen",
  title =        "Transferable Latent of {CNN}-Based Selective
                 Fixed-Filter Active Noise Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2910--2921",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Practical active noise control (ANC) systems, like the
                 active noise cancellation headphone, usually adopt a
                 control filter with preset coefficients to achieve
                 satisfactory noise reduction performance for dynamic
                 noise and higher robustness. In this \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dorian Desblancs and Vincent Lostanlen and Romain
                 Hennequin",
  title =        "Zero-Note Samba: Self-Supervised Beat Tracking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2922--2934",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Supervised machine learning for music information
                 retrieval requires a large annotated training set, and
                 is thus an expensive and time-consuming process. To
                 circumvent this problem, we propose to train deep
                 neural networks to perceive beats in musical \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Nankai Lin and Yingwen Fu and Xiaotian Lin and Dong
                 Zhou and Aimin Yang and Shengyi Jiang",
  title =        "{CL-XABSA}: Contrastive Learning for Cross-Lingual
                 Aspect-Based Sentiment Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2935--2946",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Aspect-based sentiment analysis (ABSA), an
                 extensively researched area in the field of natural
                 language processing (NLP), predicts the sentiment
                 expressed in a text relative to the corresponding
                 aspect. Unfortunately, most languages lack sufficient
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hanmeng Liu and Jian Liu and Leyang Cui and Zhiyang
                 Teng and Nan Duan and Ming Zhou and Yue Zhang",
  title =        "{LogiQA 2.0} --- an Improved Dataset for Logical
                 Reasoning in Natural Language Understanding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2947--2962",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "NLP research on logical reasoning regains momentum
                 with the recent releases of a handful of datasets,
                 notably LogiQA and Reclor. Logical reasoning is
                 exploited in many probing tasks over large Pre-trained
                 Language Models (PLMs) and downstream tasks like
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiangyan Yi and Jianhua Tao and Ruibo Fu and Tao Wang
                 and Chu Yuan Zhang and Chenglong Wang",
  title =        "Adversarial Multi-Task Learning for {Mandarin}
                 Prosodic Boundary Prediction With Multi-Modal
                 Embeddings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2963--2973",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Prosodic boundaries are still crucial to the
                 naturalness of end-to-end speech synthesis systems.
                 This article proposes to use adversarial multi-task
                 learning to predict prosodic boundaries. Adversarial
                 multi-task learning is utilized to transfer knowledge
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ji Won Yoon and Hyung Yong Kim and Hyeonseung Lee and
                 Sunghwan Ahn and Nam Soo Kim",
  title =        "Oracle Teacher: Leveraging Target Information for
                 Better Knowledge Distillation of {CTC} Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2974--2987",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Knowledge distillation (KD), best known as an
                 effective method for model compression, aims at
                 transferring the knowledge of a bigger network
                 (teacher) to a much smaller network (student).
                 Conventional KD methods usually employ the teacher
                 model trained in \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sufeng Duan and Hai Zhao and Dongdong Zhang",
  title =        "Syntax-Aware Data Augmentation for Neural Machine
                 Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "2988--2999",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Data augmentation is an effective method for the
                 performance enhancement of neural machine translation
                 (NMT) by generating additional bilingual data. In this
                 article, we propose a novel data augmentation strategy
                 for neural machine translation. Unlike \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tongzheng Liu and Zhihua Lu and Jo{\~a}o Paulo J. da
                 Costa and Tai Fei",
  title =        "A Hybrid Reverberation Model and Its Application to
                 Joint Speech Dereverberation and Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3000--3014",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This article proposes a hybrid reverberation model by
                 integrating two conventional models, namely, the
                 multichannel linear prediction (MCLP) model and the
                 spatial coherence model. The late reverberation is
                 divided into two components. One component is \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Junjun Guo and Junjie Ye and Yan Xiang and Zhengtao
                 Yu",
  title =        "Layer-Level Progressive Transformer With Modality
                 Difference Awareness for Multi-Modal Neural Machine
                 Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3015--3026",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Multi-modal neural machine translation (MNMT) aims to
                 translate sentences from the source language into the
                 target language with the aid of corresponding images.
                 Unfortunately, there is a considerable modality gap
                 between the semantic-related images and \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qian Tao and Zhihao Xiong and Bocheng Han and Xiaoyang
                 Fan and Lusi Li",
  title =        "A Novel Unsupervised Approach for Cross-Lingual Word
                 Alignment in Low Isomorphic Embedding Spaces",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3027--3041",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Cross-lingual word alignment is the task for word
                 translation between monolingual word embedding spaces
                 of two different languages. Recent work is mostly based
                 on supervised approaches, while their success relies on
                 bilingual seed dictionaries derived \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jilu Jin and Jacob Benesty and Jingdong Chen and
                 Gongping Huang",
  title =        "Differential Beamforming From a Geometric
                 Perspective",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3042--3054",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Differential microphone arrays (DMAs) have
                 demonstrated a great potential for solving the
                 high-fidelity sound acquisition problem in a wide range
                 of applications as they possess many good properties
                 such as frequency-independent beampatterns with high
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Alberto Palomo-Alonso and David Casillas-P{\'e}rez and
                 Silvia Jim{\'e}nez-Fern{\'a}ndez and Jose A.
                 Portilla-Figueras and Sancho Salcedo-Sanz",
  title =        "A Flexible Architecture Using Temporal, Spatial and
                 Semantic Correlation-Based Algorithms for Story
                 Segmentation of Broadcast News",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3055--3069",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this article, we propose a novel flexible
                 architecture, with different algorithmic procedures,
                 for effective story segmentation of broadcast news from
                 subtitle files. The proposed system exploits spatial
                 and temporal distance, as well as sentence \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bolaji Yusuf and Jan {\v{C}}ernock{\'y} and Murat
                 Sara{\c{c}}lar",
  title =        "End-to-End Open Vocabulary Keyword Search With
                 Multilingual Neural Representations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3070--3080",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Conventional keyword search systems operate on
                 automatic speech recognition (ASR) outputs, which
                 causes them to have a complex indexing and search
                 pipeline. This has led to interest in ASR-free
                 approaches to simplify the search procedure. We
                 recently \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Adrian Herzog and Srikanth Raj Chetupalli and
                 Emanu{\"e}l A. P. Habets",
  title =        "{AmbiSep}: Joint Ambisonic-to-Ambisonic Speech
                 Separation and Noise Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3081--3094",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Blind separation of the sounds in an Ambisonic sound
                 scene is a challenging problem, especially when the
                 spatial impression of these sounds needs to be
                 preserved. In this work, we consider
                 Ambisonic-to-Ambisonic separation of reverberant speech
                 mixtures, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Po-chun Hsu and Da-rong Liu and Andy T. Liu and
                 Hung-yi Lee",
  title =        "Parallel Synthesis for Autoregressive Speech
                 Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3095--3111",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Autoregressive neural vocoders have achieved
                 outstanding performance in speech synthesis tasks such
                 as text-to-speech and voice conversion. An
                 autoregressive vocoder predicts a sample at some time
                 step conditioned on those at previous time steps.
                 Though \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Siddharth Dalmia and Dmytro Okhonko and Mike Lewis and
                 Sergey Edunov and Shinji Watanabe and Florian Metze and
                 Luke Zettlemoyer and Abdelrahman Mohamed",
  title =        "{LegoNN}: Building Modular Encoder-Decoder Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3112--3126",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "State-of-the-art encoder-decoder models (e.g. for
                 machine translation (MT) or automatic speech
                 recognition (ASR)) are constructed and trained
                 end-to-end as an atomic unit. No component of the model
                 can be (re-)used without the others, making it
                 impossible \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tom Gajecki and Waldo Nogueira",
  title =        "Deep Latent Fusion Layers for Binaural Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3127--3138",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This work addresses the issue of enhancing speech in
                 binaural hearing scenarios. Specifically, we present a
                 method to improve binaural noise reduction by
                 integrating latent features produced by monaural speech
                 enhancement algorithms through the use of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Huawen Feng and Zhenxi Lin and Qianli Ma",
  title =        "Perturbation-Based Self-Supervised Attention for
                 Attention Bias in Text Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3139--3151",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In text classification, the traditional attention
                 mechanisms usually focus too much on frequent words,
                 and need extensive labeled data in order to learn. This
                 article proposes a perturbation-based self-supervised
                 attention approach to guide attention \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiaxin Zhong and Tao Zhuang and Mengtong Li and Ray
                 Kirby and Mahmoud Karimi and Jing Lu and Dong Zhang",
  title =        "Sidelobe Suppression for a Steerable Parametric Source
                 Using the Sparse Random Array Technique",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3152--3161",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "A steerable parametric source is designed to steer an
                 audio beam without mechanically rotating the source. To
                 achieve this without the generation of grating lobes
                 requires an ultrasonic array with interelement spacing
                 that is less than half the wavelength \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yan Fang and Wei Lu and Xiaodong Liu and Witold
                 Pedrycz and Qi Lang and Jianhua Yang",
  title =        "{CircularE}: a Complex Space Circular Correlation
                 Relational Model for Link Prediction in Knowledge Graph
                 Embedding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3162--3175",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Knowledge graphs are regarded as structured knowledge
                 bases that embody various facts coming from the real
                 world. Their completeness is still far from
                 satisfactory. Relational learning models in link
                 prediction can automatically find the missing \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jie Zhang and Rui Tao and Jun Du and Li-Rong Dai",
  title =        "{SDW-SWF}: Speech Distortion Weighted Single-Channel
                 {Wiener} Filter for Noise Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3176--3189",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech enhancement shows an important necessity in
                 many audio applications, particularly in noisy
                 environments, where the speech quality needs to be
                 improved. In this work, we consider the single-channel
                 noise reduction (NR) problem from the conventional
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Haozhou Li and Qinke Peng and Xu Mou and Ying Wang and
                 Zeyuan Zeng and Muhammad Fiaz Bashir",
  title =        "Abstractive Financial News Summarization via
                 Transformer-{BiLSTM} Encoder and Graph Attention-Based
                 Decoder",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3190--3205",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Financial news summarization (FNS) has been an
                 attractive research problem in recent years, which aims
                 to generate a shorter highlight of the news article
                 while preserving key factual aspects, emotions, and
                 opinions, providing significant assistance in \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Weitao Yuan and Shengbei Wang and Jianming Wang and
                 Masashi Unoki and Wenwu Wang",
  title =        "Unsupervised Deep Unfolded Representation Learning for
                 Singing Voice Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3206--3220",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Learning effective vocal representations from a
                 waveform mixture is a crucial but challenging task for
                 deep neural network (DNN)-based singing voice
                 separation (SVS). Successful representation learning
                 (RL) depends heavily on well-designed neural \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhong-Qiu Wang and Samuele Cornell and Shukjae Choi
                 and Younglo Lee and Byeong-Yeol Kim and Shinji
                 Watanabe",
  title =        "{TF-GridNet}: Integrating Full- and Sub-Band Modeling
                 for Speech Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3221--3236",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "We propose TF-GridNet for speech separation. The model
                 is a novel deep neural network (DNN) integrating full-
                 and sub-band modeling in the time-frequency (T-F)
                 domain. It stacks several blocks, each consisting of an
                 intra-frame full-band module, a sub-band \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Marvin Tammen and Simon Doclo",
  title =        "Parameter Estimation Procedures for Deep Multi-Frame
                 {MVDR} Filtering for Single-Microphone Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3237--3248",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Aiming at exploiting temporal correlations across
                 consecutive time frames in the short-time Fourier
                 transform (STFT) domain, multi-frame algorithms for
                 single-microphone speech enhancement have been
                 proposed. Typically, the multi-frame filter
                 coefficients \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yi Lin and Qingyang Wang and Xincheng Yu and Zichen
                 Zhang and Dongyue Guo and Jizhe Zhou",
  title =        "Towards Recognition for Radio-Echo Speech in Air
                 Traffic Control: Dataset and a Contrastive Learning
                 Approach",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3249--3262",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In the air traffic control (ATC) domain, automatic
                 speech recognition (ASR) suffers from radio speech
                 echo, which cannot be addressed by existing echo
                 cancellation due to auditory-oriented optimization and
                 poor generalization ability caused by volatile
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Diego Caviedes-Nozal and Efren Fernandez-Grande",
  title =        "Spatio-Temporal {Bayesian} Regression for Room Impulse
                 Response Reconstruction With Spherical Waves",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3263--3277",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The reconstruction of sound fields in a room from a
                 limited set of measurements is a central problem in
                 acoustics, with relevant applications in e.g. acoustic
                 analysis, audio, or sound field control. Conventional
                 approaches rely on measuring the room \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xinyu Hu and Xiaojun Wan",
  title =        "{RST} Discourse Parsing as Text-to-Text Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3278--3289",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Previous studies have made great advances in RST
                 discourse parsing through specific neural frameworks or
                 features, but they usually split the parsing process
                 into two subtasks and heavily depended on gold
                 discourse segmentation. In this article, we \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shun Lei and Yixuan Zhou and Liyang Chen and Zhiyong
                 Wu and Xixin Wu and Shiyin Kang and Helen Meng",
  title =        "{MSStyleTTS}: Multi-Scale Style Modeling With
                 Hierarchical Context Information for Expressive Speech
                 Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3290--3303",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Expressive speech synthesis is crucial for many
                 human-computer interaction scenarios, such as
                 audiobooks, podcasts, and voice assistants. Previous
                 works focus on predicting the style embeddings at one
                 single scale from the information within the current
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Pedro Izquierdo Lehmann and Rodrigo F. C{\'a}diz and
                 Carlos A. Sing Long",
  title =        "Towards Maximizing a Perceptual {{\em Sweet Spot\/}}
                 for Spatial Sound With Loudspeakers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3304--3319",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The {\em sweet spot\/} can be interpreted as the
                 region where acoustic sources create a spatial auditory
                 illusion. We study the problem of maximizing this sweet
                 spot when reproducing a desired sound wave using an
                 array of loudspeakers. To achieve \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Han Zhu and Dongji Gao and Gaofeng Cheng and Daniel
                 Povey and Pengyuan Zhang and Yonghong Yan",
  title =        "Alternative Pseudo-Labeling for Semi-Supervised
                 Automatic Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3320--3330",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "When labeled data is insufficient, pseudo-labeling
                 based semi-supervised learning can significantly
                 improve the performance of automatic speech
                 recognition. However, pseudo-labels are often noisy,
                 containing numerous incorrect tokens. Taking noisy
                 labels \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Junqing Zhang and Liming Shi and Mads Gr{\ae}sb{\o}ll
                 Christensen and Wen Zhang and Lijun Zhang and Jingdong
                 Chen",
  title =        "{CGMM}-Based Sound Zone Generation Using Robust
                 Pressure Matching With {ATF} Perturbation Constraints",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3331--3345",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Personal sound zone (PSZ) refers to the technique that
                 uses an array of loudspeakers and digital signal
                 processing tools to achieve spatial soundfield control.
                 To generate the target sound zones, this technique
                 generally requires to know the acoustic \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Erfan Loweimi and Andrea Carmantini and Peter Bell and
                 Steve Renals and Zoran Cvetkovic",
  title =        "Phonetic Error Analysis Beyond Phone Error Rate",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3346--3361",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this article, we analyse the performance of the
                 TIMIT-based phone recognition systems beyond the
                 overall phone error rate (PER) metric. We consider
                 three broad phonetic classes (BPCs): affricate,
                 diphthong, fricative, nasal, plosive, semi-vowel,
                 vowel, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Runxuan Yang and Yuyang Peng and Xiaolin Hu",
  title =        "A Fast High-Fidelity Source-Filter Vocoder With
                 Lightweight Neural Modules",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3362--3373",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The quality of raw audio waveform generated by a
                 vocoder could affect various audio generative tasks. In
                 recent years, the dominance of source-filter vocoders
                 was greatly challenged by neural vocoders as the latter
                 presents far superior synthesized audio \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuxiang Zhang and Zhuo Li and Jingze Lu and Hua Hua
                 and Wenchao Wang and Pengyuan Zhang",
  title =        "The Impact of Silence on Speech Anti-Spoofing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3374--3389",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The current speech anti-spoofing countermeasures (CMs)
                 show excellent performance on specific datasets.
                 However, removing the silence of test speech through
                 Voice Activity Detection (VAD) can severely degrade
                 performance. In this article, the impact of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Philippe Gonzalez and Tommy Sonne Alstr{\o}m and
                 Tobias May",
  title =        "Assessing the Generalization Gap of Learning-Based
                 Speech Enhancement Systems in Noisy and Reverberant
                 Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3390--3403",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The acoustic variability of noisy and reverberant
                 speech mixtures is influenced by multiple factors, such
                 as the spectro-temporal characteristics of the target
                 speaker and the interfering noise, the signal-to-noise
                 ratio (SNR) and the room \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ziyi Xu and Ziyue Zhao and Tim Fingscheidt",
  title =        "Coded Speech Quality Measurement by a Non-Intrusive
                 {PESQ-DNN}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3404--3417",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Wideband codecs such as AMR-WB or EVS are widely used
                 in (mobile) speech communication. Evaluation of coded
                 speech quality is often performed subjectively by an
                 absolute category rating (ACR) listening test. However,
                 the ACR test is impractical for online \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tao Li and Chenxu Hu and Jian Cong and Xinfa Zhu and
                 Jingbei Li and Qiao Tian and Yuping Wang and Lei Xie",
  title =        "{DiCLET-TTS}: Diffusion Model Based Cross-Lingual
                 Emotion Transfer for Text-to-Speech --- a Study Between
                 {English} and {Mandarin}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3418--3430",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "While the performance of cross-lingual TTS based on
                 monolingual corpora has been significantly improved
                 recently, generating cross-lingual speech still suffers
                 from the foreign accent problem, leading to limited
                 naturalness. Besides, current cross-lingual \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xuexin Xu and Liang Shi and Xunquan Chen and Pingyuan
                 Lin and Jie Lian and Jinhui Chen and Zhihong Zhang and
                 Edwin R. Hancock",
  title =        "Any-to-Any Voice Conversion With Multi-Layer Speaker
                 Adaptation and Content Supervision",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3431--3445",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Any-to-any voice conversion can be performed among
                 arbitrary speakers, even with a single reference
                 utterance. Many related studies have demonstrated that
                 it can be effectively implemented by speech
                 representation disentanglement. However, most existing
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chenpeng Du and Yiwei Guo and Xie Chen and Kai Yu",
  title =        "Speaker Adaptive Text-to-Speech With Timbre-Normalized
                 Vector-Quantized Feature",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3446--3456",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Achieving high fidelity and speaker similarity in
                 text-to-speech speaker adaptation with limited amount
                 of data is a challenging task. Most existing methods
                 only consider adapting to the timbre of the target
                 speakers but fail to capture their speaking \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yash Kumar Atri and Vikram Goyal and Tanmoy
                 Chakraborty",
  title =        "Multi-Document Summarization Using Selective Attention
                 Span and Reinforcement Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3457--3467",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Abstractive text summarization systems using recently
                 improved RNN-based sequence-to-sequence architecture
                 have shown great promise for single-document
                 summarization. However, such neural models fail to
                 perpetuate the performance in the multi-document
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Maochun Huang and Chunmei Qing and Junpeng Tan and
                 Xiangmin Xu",
  title =        "Context-Based Adaptive Multimodal Fusion Network for
                 Continuous Frame-Level Sentiment Prediction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3468--3477",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Recently, video sentiment computing has become the
                 focus of research because of its benefits in many
                 applications such as digital marketing, education,
                 healthcare, and so on. The difficulty of video
                 sentiment prediction mainly lies in the regression
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sebastian J. Schlecht and Jon Fagerstr{\"o}m and Vesa
                 V{\"a}lim{\"a}ki",
  title =        "Decorrelation in Feedback Delay Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3478--3487",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The feedback delay network (FDN) is a popular filter
                 structure to generate artificial spatial reverberation.
                 A common requirement for multichannel late
                 reverberation is that the output signals are well
                 decorrelated, as too high a correlation can lead to
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jinliang Lu and Jiajun Zhang",
  title =        "Towards Unified Multi-Domain Machine Translation With
                 Mixture of Domain Experts",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3488--3498",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Multi-domain machine translation (MDMT) aims to
                 construct models with mixed-domain training corpora to
                 switch translation between different domains. Previous
                 studies either assume that the domain information is
                 given and leverage the domain knowledge to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Julien Hauret and Thomas Joubaud and V{\'e}ronique
                 Zimpfer and {\'E}ric Bavu",
  title =        "Configurable {EBEN}: Extreme Bandwidth Extension
                 Network to Enhance Body-Conducted Speech Capture",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3499--3512",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This article presents a configurable version of
                 Extreme Bandwidth Extension Network (EBEN), a
                 Generative Adversarial Network (GAN) designed to
                 improve audio captured with body-conduction
                 microphones. We show that although these microphones
                 significantly \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wanli Peng and Sheng Li and Zhenxing Qian and Xinpeng
                 Zhang",
  title =        "Text Steganalysis Based on Hierarchical Supervised
                 Learning and Dual Attention Mechanism",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3513--3526",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Recent methods with deep neural networks for text
                 steganalysis have succeeded in mining various feature
                 representations. However, a limited number of studies
                 have explicitly analyzed potential security issues of
                 generative text steganography. Furthermore, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lin Xu and Qixian Zhou and Jinlan Fu and See-Kiong
                 Ng",
  title =        "{CET2}: Modelling Topic Transitions for Coherent and
                 Engaging Knowledge-Grounded Conversations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3527--3536",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Knowledge-grounded dialogue systems aim to generate
                 coherent and engaging responses based on the dialogue
                 contexts and selected external knowledge. Previous
                 knowledge selection methods tend to rely too heavily on
                 the dialogue contexts or over-emphasize \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Vincent W. Neo and Christine Evers and Stephan Weiss
                 and Patrick A. Naylor",
  title =        "Signal Compaction Using Polynomial {EVD} for Spherical
                 Array Processing With Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3537--3549",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Multi-channel signals captured by spatially separated
                 sensors often contain a high level of data redundancy.
                 A compact signal representation enables more efficient
                 storage and processing, which has been exploited for
                 data compression, noise reduction, and \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Gerald Enzner and Svantje Voit",
  title =        "Hybrid-Frequency-Resolution Adaptive {Kalman} Filter
                 for Online Identification of Long Acoustic Responses
                 With Low Input-Output Latency",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3550--3563",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Online acoustic system identification is one of the
                 most challenging tasks for adaptive filters. Along with
                 the desired accuracy in applications such as acoustic
                 echo cancellation, it bears requirements of
                 accommodating high-order systems \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shang Gao and Maoshen Jia and Dingding Yao and Jing
                 Wang",
  title =        "Multi-Source Localization Using Optimized
                 Time-Frequency Representation and Sparsity Component
                 Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3564--3578",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This article aims to address the multi-source
                 localization problem by exploiting the sparsity of the
                 speech signal in the time-frequency domain, where the
                 challenge mainly lies in extracting the sparse
                 component. An optimized time-frequency representation
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qi He and Mingjie Gao and Ka Fai Cedric Yiu and Sven
                 Nordholm",
  title =        "Distributed Microphone Array Localization Problem via
                 {SDP-SOCP} Method",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3579--3588",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In multimedia applications, it is common to employ
                 acoustic sensors collectively to enhance signals and to
                 locate sound sources. A direct problem can be
                 formulated to locate sound sources from a set of known
                 sensors. In order to form the acoustic sensor
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hiroshi Sawada and Rintaro Ikeshita and Keisuke
                 Kinoshita and Tomohiro Nakatani",
  title =        "Multi-Frame Full-Rank Spatial Covariance Analysis for
                 Underdetermined Blind Source Separation and
                 Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3589--3602",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Full-rank spatial covariance analysis (FCA) is a
                 technique for blind source separation (BSS), and can be
                 applied to underdetermined situations where the sources
                 outnumber the microphones. This paper proposes
                 multi-frame FCA as an extension of FCA to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hongyang Chang and Hongfei Xu and Josef van Genabith
                 and Deyi Xiong and Hongying Zan",
  title =        "{JoinER-BART}: Joint Entity and Relation Extraction
                 With Constrained Decoding, Representation Reuse and
                 Fusion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3603--3616",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Joint Entity and Relation Extraction (JERE) is an
                 important research direction in Information Extraction
                 (IE). Given the surprising performance with fine-tuning
                 of pre-trained BERT in a wide range of NLP tasks,
                 nowadays most studies for JERE are based on \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xinqi Huang and Yingsong Li and Yuriy Zakharov and
                 Yongchun Miao and Zhixiang Huang",
  title =        "Squared Sine Adaptive Algorithm and Its Performance
                 Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3617--3628",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The squared sine adaptive (SSA) algorithm is presented
                 for identification scenarios, such as acoustic-echo
                 cancellation (AEC) applications, in non-Gaussian
                 environments. To devise the SSA algorithm, a novel cost
                 function is constructed by exerting a \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Andong Li and Guochen Yu and Chengshi Zheng and Wenzhe
                 Liu and Xiaodong Li",
  title =        "A General Unfolding Speech Enhancement Method
                 Motivated by {Taylor}'s Theorem",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3629--3646",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "While deep neural networks have facilitated
                 significant advancements in the field of speech
                 enhancement, most existing methods are developed
                 following either empirical or relatively blind
                 criteria, lacking adequate guidelines in pipeline
                 design. Inspired \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bin Gu and Jie Zhang and Wu Guo",
  title =        "A Dynamic Convolution Framework for
                 Session-Independent Speaker Embedding Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3647--3658",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speaker verification (SV) has suffered from session
                 variability in complex acoustic scenarios, and learning
                 session independent speaker representations remains a
                 challenging problem. To tackle this, we propose a
                 dynamic convolution framework for SV in \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Daojian Zeng and Chao Zhao and Chao Jiang and Jianling
                 Zhu and Jianhua Dai",
  title =        "Document-Level Relation Extraction With Context Guided
                 Mention Integration and Inter-Pair Reasoning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3659--3666",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Document-level Relation Extraction (DRE) aims to
                 recognize the relations between two entities. The
                 entity may correspond to multiple mentions that span
                 beyond the sentence boundary. Few previous studies have
                 investigated the mention integration, which may
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lu Li and Maoshen Jia and Jing Wang and Ruiyuan Cao",
  title =        "Multiple-Speech-Source {DOA} Estimation Based on
                 Single-Source Cluster Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3667--3680",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This study proposes multiple-speech-source
                 direction-of-arrival (DOA) estimation based on the
                 distribution characteristic of the time-frequency (TF)
                 point dominated by a single-source component (i.e.,
                 single-source point, SSP). By exploring the TF
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaoxiao Miao and Xin Wang and Erica Cooper and
                 Junichi Yamagishi and Natalia Tomashenko",
  title =        "Speaker Anonymization Using Orthogonal {Householder}
                 Neural Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3681--3695",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speaker anonymization aims to conceal a speaker's
                 identity while preserving content information in
                 speech. Current mainstream neural-network speaker
                 anonymization systems disentangle speech into
                 prosody-related, content, and speaker \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhengshan Xue and Xiaolei Zhang and Tingxun Shi and
                 Deyi Xiong",
  title =        "{DetTrans}: a Lightweight Framework to Detect and
                 Translate Noisy Inputs Simultaneously",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3696--3705",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Neural machine translation (NMT) systems trained on
                 clean data usually suffer from performance degradation
                 when translating noisy inputs. Existing works attempt
                 to improve the robustness of NMT normally via data
                 augmentation, where synthetic noisy data \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chang Liu and Zhen-Hua Ling and Ling-Hui Chen",
  title =        "Pronunciation Dictionary-Free Multilingual Speech
                 Synthesis Using Learned Phonetic Representations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3706--3716",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This article presents a multilingual speech synthesis
                 approach that leverages learned phonetic
                 representations to eliminate the need for pronunciation
                 dictionaries in target languages. The learned phonetic
                 representations consist of unsupervised phonetic
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Reo Yoneyama and Yi-Chiao Wu and Tomoki Toda",
  title =        "High-Fidelity and Pitch-Controllable Neural Vocoder
                 Based on Unified Source-Filter Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3717--3729",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "We introduce unified source-filter generative
                 adversarial networks (uSFGAN), a waveform generative
                 model conditioned on acoustic features, which
                 represents the source-filter architecture in a
                 generator network. Unlike the previous neural-based
                 source-filter \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Stefan Thaleiser and Gerald Enzner",
  title =        "Binaural-Projection Multichannel {Wiener} Filter for
                 Cue-Preserving Binaural Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3730--3745",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Former research in binaural speech enhancement has
                 demonstrated a demand of binaural cue preservation
                 beyond the requirements of noise suppression and speech
                 quality. The binaural state-of-the-art is frequently
                 grouped into the class of spatio-temporal \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yixin Wang and Wei Wei and Xiangming Gu and Xiaohong
                 Guan and Ye Wang",
  title =        "Disentangled Adversarial Domain Adaptation for
                 Phonation Mode Detection in Singing and Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3746--3759",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Phonation mode detection predicts phonation modes and
                 their temporal boundaries in singing and speech,
                 holding promise for characterizing voice quality and
                 vocal health. However, it is very challenging due to
                 the domain disparities between training data \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yixuan Zhang and Heming Wang and DeLiang Wang",
  title =        "{$ F0 $} Estimation and Voicing Detection With Cascade
                 Architecture in Noisy Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3760--3770",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "As a fundamental problem in speech processing, pitch
                 tracking has been studied for decades. While strong
                 performance has been achieved on clean speech, pitch
                 tracking in noisy speech is still challenging. Severe
                 non-stationary noises not only corrupt the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhengdao Zhao and Yuhua Wang and Guang Shen and Yuezhu
                 Xu and Jiayuan Zhang",
  title =        "{TDFNet}: Transformer-Based Deep-Scale Fusion Network
                 for Multimodal Emotion Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3771--3782",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "As deep learning technology research continues to
                 progress, artificial intelligence technology is
                 gradually empowering various fields. To achieve a more
                 natural human-computer interaction experience, how to
                 accurately recognize emotional state of speech
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Johannes M. Arend and Christoph P{\"o}rschmann and
                 Stefan Weinzierl and Fabian Brinkmann",
  title =        "Magnitude-Corrected and Time-Aligned Interpolation of
                 Head-Related Transfer Functions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3783--3799",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Head-related transfer functions (HRTFs) are essential
                 for virtual acoustic realities because they contain all
                 cues for localizing sound sources in three-dimensional
                 space. Acoustic measurements are one way to obtain
                 high-quality HRTFs. To reduce \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Desh Raj and Daniel Povey and Sanjeev Khudanpur",
  title =        "{SURT} 2.0: Advances in Transducer-Based Multi-Talker
                 Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3800--3813",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The Streaming Unmixing and Recognition Transducer
                 (SURT) model was proposed recently as an end-to-end
                 approach for continuous, streaming, multi-talker speech
                 recognition (ASR). Despite impressive results on
                 multi-turn meetings, SURT has notable \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiaming An and Zixiang Ding and Ke Li and Rui Xia",
  title =        "Global-View and Speaker-Aware Emotion Cause Extraction
                 in Conversations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3814--3823",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Emotion cause extraction in conversations, the task of
                 recognizing and extracting the causes behind the
                 emotions in a conversation, is a new and under-explored
                 task. It was previously treated as an utterance-level
                 task, that can only extract cause of one \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuqin Lin and Longbiao Wang and Yanbing Yang and
                 Jianwu Dang",
  title =        "{CFDRN}: a Cognition-Inspired Feature Decomposition
                 and Recombination Network for Dysarthric Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3824--3836",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "As an essential technology in human-computer
                 interactions, automatic speech recognition (ASR)
                 ensures a convenient life for healthy people; however,
                 people with speech disorders, who truly need support
                 from such a technology, have experienced \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "R{\'e}mi Blandin and Simon Stone and Ang{\'e}lique
                 Remacle and Vincent Didone and Peter Birkholz",
  title =        "A Comparative Study of {$3$D} and {$1$D} Acoustic
                 Simulations of the Higher Frequencies of Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3837--3847",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Articulatory synthesis generates speech sounds by
                 simulating the physical phenomena involved in speech
                 production. The accuracy of the physical modelling is
                 expected to affect the naturalness of the synthesis:
                 the more realistic the description is, the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qing Wang and Jixun Yao and Li Zhang and Pengcheng Guo
                 and Lei Xie",
  title =        "Timbre-Reserved Adversarial Attack in Speaker
                 Identification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3848--3858",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "As a type of biometric identification, speaker
                 identification (SID) systems face various attacks.
                 Spoofing attacks imitate target speakers' timbre, while
                 adversarial attacks confuse SID systems with
                 well-designed perturbations. Spoofing mimics \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yachao Li and Junhui Li and Jing Jiang and Shimin Tao
                 and Hao Yang and Min Zhang",
  title =        "P-Transformer: Towards Better Document-to-Document
                 Neural Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3859--3870",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Directly training a document-to-document (Doc2Doc)
                 neural machine translation (NMT) via Transformer from
                 scratch, especially on small datasets, usually fails to
                 converge. Our dedicated probing tasks show that (1)
                 both the absolute position and relative \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chao Xie and Tomoki Toda",
  title =        "Noisy-to-Noisy Voice Conversion Under Variations of
                 Noisy Condition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3871--3882",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Voice conversion (VC) refers to the transformation of
                 the speaker identity of a speech to the target one
                 without altering the linguistic content. As recent VC
                 techniques have made significant progress, implementing
                 them in real-world scenarios is also \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhichao Wang and Xinsheng Wang and Qicong Xie and Tao
                 Li and Lei Xie and Qiao Tian and Yuping Wang",
  title =        "{MSM-VC}: High-Fidelity Source Style Transfer for
                 Non-Parallel Voice Conversion by Multi-Scale Style
                 Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3883--3895",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In addition to conveying the linguistic content from
                 source speech to converted speech, maintaining the
                 speaking style of source speech also plays an important
                 role in the voice conversion (VC) task, which is
                 essential in many scenarios with highly \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yilin Zhao and Hai Zhao and Sufeng Duan",
  title =        "Multi-Grained Evidence Inference for Multi-Choice
                 Reading Comprehension",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3896--3907",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Multi-choice Machine Reading Comprehension (MRC) is a
                 major and challenging task for machines to answer
                 questions according to provided options. Answers in
                 multi-choice MRC cannot be directly extracted in the
                 given passages, and essentially require \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ye-Qian Du and Jie Zhang and Xin Fang and Ming-Hui Wu
                 and Zhou-Wang Yang",
  title =        "A Semi-Supervised Complementary Joint Training
                 Approach for Low-Resource Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3908--3921",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Both unpaired speech and text have shown to be
                 beneficial for low-resource automatic speech
                 recognition (ASR), which, however were either
                 separately used for pre-training, self-training and
                 language model (LM) training, or jointly used for
                 designing \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Changheng Li and Richard C. Hendriks",
  title =        "Alternating Least-Squares-Based Microphone Array
                 Parameter Estimation for a Single-Source Reverberant
                 and Noisy Acoustic Scenario",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3922--3934",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Acoustic-scene-related parameters such as relative
                 transfer functions (RTFs) and power spectral densities
                 (PSDs) of the target source, late reverberation and
                 ambient noise are essential for microphone array signal
                 processing and are challenging to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kun Zhou and Yuanhang Zhou and Wayne Xin Zhao and
                 Ji-Rong Wen",
  title =        "Learning to Perturb for Contrastive Learning of
                 Unsupervised Sentence Representations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3935--3944",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Recently, contrastive learning has been shown
                 effective in fine-tuning pre-trained language models
                 (PLM) to learn sentence representations, which
                 incorporates perturbations into unlabeled sentences to
                 augment semantically related positive examples for
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Georg G{\"o}tz and Sebastian J. Schlecht and Ville
                 Pulkki",
  title =        "Common-Slope Modeling of Late Reverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3945--3957",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The decaying sound field in rooms is typically
                 described by energy decay functions (EDFs). Late
                 reverberation can deviate considerably from the ideal
                 diffuse field, for example, in multiple connected rooms
                 or non-uniform absorption material distributions.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Guanhua Chen and Runzhe Zhan and Derek F. Wong and
                 Lidia S. Chao",
  title =        "Multi-Level Curriculum Learning for Multi-Turn
                 Dialogue Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3958--3967",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Since deep learning is the dominant paradigm in the
                 multi-turn dialogue generation task, large-scale
                 training data is the key factor affecting the model
                 performance. To make full use of the training data, the
                 existing work directly applied curriculum \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yun-Yen Chuang and Hung-Min Hsu and Kevin Lin and
                 Ray-I. Chang and Hung-Yi Lee",
  title =        "{MetaEx-GAN}: Meta Exploration to Improve Natural
                 Language Generation via Generative Adversarial
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3968--3980",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Generative Adversarial Networks (GANs) have been
                 popularly researched in natural language generation,
                 so-called Language GANs. Existing works adopt
                 reinforcement learning (RL) based methods such as
                 policy gradients for training Language GANs. The
                 previous \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chuxuan Tong and Xi Zheng and Jianhua Li and Xingjun
                 Ma and Longxiang Gao and Yong Xiang",
  title =        "Query-Efficient Black-{Box} Adversarial Attacks on
                 Automatic Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3981--3992",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The susceptibility of Deep Neural Networks (DNNs) to
                 adversarial attacks has raised concerns regarding their
                 practical applications in real-world scenarios.
                 Although the vulnerability of DNNs to adversarial
                 attacks has been extensively studied in the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xixin Wu and Hui Lu and Kun Li and Zhiyong Wu and
                 Xunying Liu and Helen Meng",
  title =        "Hiformer: Sequence Modeling Networks With Hierarchical
                 Attention Mechanisms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "3993--4003",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The attention-based encoder-decoder structure, such as
                 the Transformer, has achieved state-of-the-art
                 performance on various sequence modeling tasks, e.g.,
                 machine translation (MT) and automatic speech
                 recognition (ASR), benefited from the superior
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ante Wang and Linfeng Song and Lifeng Jin and Junfeng
                 Yao and Haitao Mi and Chen Lin and Jinsong Su and Dong
                 Yu",
  title =        "{D$^2$PSG}: Multi-Party Dialogue Discourse Parsing as
                 Sequence Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "4004--4013",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Conversational discourse analysis aims to extract the
                 interactions between dialogue turns, which is crucial
                 for modeling complex multi-party dialogues. As the
                 benchmarks are still limited in size and human
                 annotations are costly, the current standard \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Nan Gao and Yongjian Wang and Peng Chen and Jijun
                 Tang",
  title =        "Boosting Short Text Classification by Solving the
                 {OOV} Problem",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "31",
  number =       "??",
  pages =        "4014--4024",
  year =         "2023",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:06:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In the field of natural language processing, text
                 classification has received a lot of attention.
                 Compared with long texts, short texts have fewer words
                 and lack contextual semantic information. Existing
                 approaches enrich short text information by linking
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jin Chu Wu and Raghu N. Kacker",
  title =        "Statistical Analysis for Speaker Recognition
                 Evaluation With Data Dependence and Three Score
                 Distributions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1--14",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The speaker recognition evaluation is conducted in a
                 framework in which three score distributions and two
                 decision thresholds are employed, and the statistic of
                 interest is an average of the two weighted sums \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yongwei Zhou and Junwei Bao and Youzheng Wu and
                 Xiaodong He and Tiejun Zhao",
  title =        "Operation-Augmented Numerical Reasoning for Question
                 Answering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "15--28",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Question answering requiring numerical reasoning,
                 which generally involves symbolic operations such as
                 sorting, counting, and addition, is a challenging task.
                 To address such a problem, existing mixture-of-experts
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Anurenjan Purushothaman and Debottam Dutta and Rohit
                 Kumar and Sriram Ganapathy",
  title =        "Speech Dereverberation With Frequency Domain
                 Autoregressive Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "29--38",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech applications in far-field real world settings
                 often deal with signals that are corrupted by
                 reverberation. The task of dereverberation constitutes
                 an important step to improve the audible quality and to
                 reduce the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Leyuan Qu and Taihao Li and Cornelius Weber and
                 Theresa Pekarek-Rosin and Fuji Ren and Stefan Wermter",
  title =        "Disentangling Prosody Representations With
                 Unsupervised Speech Reconstruction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "39--54",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Human speech can be characterized by different
                 components, including semantic content, speaker
                 identity and prosodic information. Significant progress
                 has been made in disentangling representations for
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Mathias Bach Pedersen and S{\o}ren Holdt Jensen and
                 Zheng-Hua Tan and Jesper Jensen",
  title =        "Data-Driven Non-Intrusive Speech Intelligibility
                 Prediction Using Speech Presence Probability",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "55--67",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Time consuming Speech Intelligibility (SI) listening
                 tests with human subjects can be replaced by
                 algorithmic SI predictors. In recent years, data-driven
                 SI predictors have been showing promising results. A
                 major limiting \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuanbo Hou and Bo Kang and Andrew Mitchell and Wenwu
                 Wang and Jian Kang and Dick Botteldooren",
  title =        "Cooperative Scene-Event Modelling for Acoustic Scene
                 Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "68--82",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Acoustic scene classification (ASC) can be helpful for
                 creating context awareness for intelligent robots.
                 Humans naturally use the relations between acoustic
                 scenes (AS) and audio events (AE) to understand and
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaotong Jiang and Peiwen You and Chen Chen and
                 Zhongqing Wang and Guodong Zhou",
  title =        "Exploring Scope Detection for Aspect-Based Sentiment
                 Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "83--94",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Aspect-based sentiment analysis (ABSA) aims to
                 extract the aspect terms from review text, and to
                 predict the polarity towards the aspect term. Although
                 neural models have achieved competitive results, there
                 are still \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xuenan Xu and Zeyu Xie and Mengyue Wu and Kai Yu",
  title =        "Beyond the Status Quo: a Contemporary Survey of
                 Advances and Challenges in Audio Captioning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "95--112",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Automated audio captioning (AAC), a task that mimics
                 human perception as well as innovatively links audio
                 processing and natural language processing, has
                 overseen much progress over the last few years. AAC
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Federico Miotello and Mirco Pezzoli and Luca
                 Comanducci and Fabio Antonacci and Augusto Sarti",
  title =        "Deep Prior-Based Audio Inpainting Using
                 Multi-Resolution Harmonic Convolutional Neural
                 Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "113--123",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this manuscript, we propose a novel method to
                 perform audio inpainting, i.e., the restoration of
                 audio signals presenting multiple missing parts. Audio
                 inpainting can be interpreted in the context of inverse
                 problems as \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Cristian-Lucian Stanciu and Jacob Benesty and
                 Constantin Paleologu and Ruxandra-Liana Costea and
                 Laura-Maria Dogariu and Silviu Ciochin{\u{a}}",
  title =        "Decomposition-Based {Wiener} Filter Using the
                 {Kronecker} Product and Conjugate Gradient Method",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "124--138",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The identification of long-length impulse responses
                 represents a challenge in the context of many
                 applications, like echo cancellation. Recently, the
                 problem has been addressed in the framework of low-rank
                 systems, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Huiyao Chen and Yueheng Sun and Meishan Zhang and Min
                 Zhang",
  title =        "Automatic Noise Generation and Reduction for Text
                 Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "139--150",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Label noise is an important issue in machine learning,
                 which might lead to negative influences on various
                 tasks. Given that real benchmarks for evaluation of
                 noise reduction methods are limited, plenty of studies
                 construct \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiaming Xu and Jian Cui and Yunzhe Hao and Bo Xu",
  title =        "Multi-Cue Guided Semi-Supervised Learning Toward
                 Target Speaker Separation in Real Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "151--163",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "To solve the cocktail party problem in real
                 multi-talker environments, this article proposed a
                 multi-cue guided semi-supervised target speaker
                 separation method (MuSS). Our MuSS integrates three
                 target speaker-related \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yang Xiang and Jesper Lisby H{\o}jvang and Morten
                 H{\o}jfeldt Rasmussen and Mads Gr{\ae}sb{\o}ll
                 Christensen",
  title =        "A Two-Stage Deep Representation Learning-Based Speech
                 Enhancement Method Using Variational Autoencoder and
                 Adversarial Training",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "164--177",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This article focuses on leveraging deep representation
                 learning (DRL) for speech enhancement (SE). In general,
                 the performance of the deep neural network (DNN) is
                 heavily dependent on the learning of data
                 representation. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiao Li and Ruirui Liu and Huichou Huang and Qingyao
                 Wu",
  title =        "Contrastive Learning for Target Speaker Extraction
                 With Attention-Based Fusion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "178--188",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Given a reference speech clip from the target speaker,
                 Target Speaker Extraction (TSE) is a challenging task
                 that involves extracting the signal of the target
                 speaker from a multi-speaker environment. TSE networks
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaobo Liang and Runze Mao and Lijun Wu and Juntao Li
                 and Min Zhang and Qing Li",
  title =        "Enhancing Low-Resource {NLP} by Consistency Training
                 With Data and Model Perturbations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "189--199",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Natural language processing (NLP) has recently shown
                 significant progress in rich-resource scenarios.
                 However, it is much less effective for low-resource
                 scenarios due to the model easily overfitting to
                 limited training data \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Haisheng Lu and Jiangnan Liang and Chuang Shi",
  title =        "Comments on ``{Primary}-Ambient Extraction Using
                 Ambient Spectrum Estimation for Immersive Spatial Audio
                 Reproduction''",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "200--202",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  note =         "See \cite{He:2015:PAE}.",
  URL =          "",
  abstract =     "In the above paper, He et al. propose a
                 primary-ambient extraction method using ambient phase
                 estimation with a sparsity constraint (APES). The
                 primary-ambient extraction problem is formulated as a
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Szymon Drgas and Lars Bramsl{\o}w and Archontis
                 Politis and Gaurav Naithani and Tuomas Virtanen",
  title =        "Dynamic Processing Neural Network Architecture for
                 Hearing Loss Compensation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "203--214",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper proposes neural networks for compensating
                 sensorineural hearing loss. The aim of the hearing loss
                 compensation task is to transform a speech signal to
                 increase speech intelligibility after further \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Femke B. Gelderblom and Tron Vedul Tronstad and
                 Torbj{\o}rn Svendsen and Tor Andre Myrvoll",
  title =        "On the Predictive Power of Objective Intelligibility
                 Metrics for the Subjective Performance of Deep Complex
                 Convolutional Recurrent Speech Enhancement Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "215--226",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech enhancement (SE) systems aim to improve the
                 quality and intelligibility of degraded speech signals
                 obtained from far-field microphones. Subjective
                 evaluation of the intelligibility performance of these
                 SE \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Thomas Haubner and Andreas Brendel and Walter
                 Kellermann",
  title =        "End-to-End Deep Learning-Based Adaptation Control for
                 Linear Acoustic Echo Cancellation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "227--238",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The attenuation of acoustic loudspeaker echoes remains
                 to be one of the open challenges to achieve pleasant
                 full-duplex hands free speech communication. In many
                 modern signal enhancement interfaces, this problem is
                 \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Congcong Jiang and Tieyun Qian and Bing Liu",
  title =        "One General Teacher for Multi-Data Multi-Task: a New
                 Knowledge Distillation Framework for Discourse Relation
                 Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "239--249",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatically identifying the discourse relations can
                 help many downstream NLP tasks such as reading
                 comprehension and machine translation. It can be
                 categorized into explicit and implicit discourse \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Khandokar Md. Nayem and Donald S. Williamson",
  title =        "Attention-Based Speech Enhancement Using Human Quality
                 Perception Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "250--260",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Perceptually-inspired objective functions such as the
                 perceptual evaluation of speech quality (PESQ),
                 signal-to-distortion ratio (SDR), and short-time
                 objective intelligibility (STOI), have recently been
                 used to \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ying Zhang and Fandong Meng and Yufeng Chen and Jinan
                 Xu and Jie Zhou",
  title =        "Complex Question Enhanced Transfer Learning for
                 Zero-Shot Joint Information Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "261--275",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Zero-shot information extraction (IE) tasks have
                 attracted great attention recently. However, how to
                 jointly model multiple IE tasks in the zero-shot
                 scenario is still an open question. In this article, we
                 focus on zero-shot \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jingsong Yan and Piji Li and Haibin Chen and Junhao
                 Zheng and Qianli Ma",
  title =        "Does the Order Matter? {A} Random Generative Way to
                 Learn Label Hierarchy for Hierarchical Text
                 Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "276--285",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Hierarchical Text Classification (HTC) is an essential
                 and challenging task due to the difficulty of modeling
                 label hierarchy. Recent generative methods have
                 achieved state-of-the-art performance by flattening the
                 \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Georgios Paraskevopoulos and Theodoros Kouzelis and
                 Georgios Rouvalis and Athanasios Katsamanis and
                 Vassilis Katsouros and Alexandros Potamianos",
  title =        "Sample-Efficient Unsupervised Domain Adaptation of
                 Speech Recognition Systems: a Case Study for Modern
                 {Greek}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "286--299",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Modern speech recognition systems exhibit rapid
                 performance degradation under domain shift. This issue
                 is especially prevalent in data-scarce settings, such
                 as low-resource languages, where the diversity of
                 \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ernesto Accolti and Javier Gimenez and Michael
                 Vorl{\"a}nder",
  title =        "Uncertainties of Room Acoustics Simulation Due to
                 Directivity Data of Musical Instruments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "300--309",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Simulations and auralization methods in the field of
                 room acoustics require the directivity of sound sources
                 in third-octave frequency bands, which simplifies the
                 calculation algorithms but introduces uncertainty.
                 However, \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yoshiki Masuyama and Kouei Yamaoka and Yuma Kinoshita
                 and Taishi Nakashima and Nobutaka Ono",
  title =        "Causal and Relaxed-Distortionless Response Beamforming
                 for Online Target Source Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "310--324",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we propose a low-latency beamforming
                 method for target source extraction. Beamforming has
                 been performed in the time-frequency domain and
                 achieved promising results in offline applications.
                 \ldots (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rohit Prabhavalkar and Takaaki Hori and Tara N.
                 Sainath and Ralf Schl{\"u}ter and Shinji Watanabe",
  title =        "End-to-End Speech Recognition: a Survey",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "325--351",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In the last decade of automatic speech recognition
                 (ASR) research, the introduction of deep learning has
                 brought considerable reductions in word error rate of
                 more than 50\% relative, compared to modeling \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yun Zhao and Dexi Liu and Changxuan Wan and Xiping Liu
                 and Jian-yun Nie and Jiaming Liu",
  title =        "{JMS-QA}: a Joint Hierarchical Architecture for Mental
                 Health Question Answering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "352--363",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "With the increasing scale of mental health problems in
                 modern society, the scarcity of professional assistance
                 is alarming, especially in developing countries. To
                 address this, some online forums have emerged to \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shiwen Ni and Jiawen Li and Min Yang and Hung-Yu Kao",
  title =        "{DropAttack}: a Random Dropped Weight Attack
                 Adversarial Training for Natural Language
                 Understanding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "364--373",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Adversarial training has been proven to be a powerful
                 regularization technique to improve language models. In
                 this work, we propose a novel random \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tiantian Zhu and Yang Qin and Ming Feng and Qingcai
                 Chen and Baotian Hu and Yang Xiang",
  title =        "{BioPRO}: Context-Infused Prompt Learning for
                 Biomedical Entity Linking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "374--385",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Recent research tends to address the biomedical entity
                 linking problem in a unified framework solely based on
                 surface form matching between mentions and entities.
                 Specifically, these methods focus on addressing \ldots
                 (More)",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiapu Wang and Boyue Wang and Junbin Gao and Simin Hu
                 and Yongli Hu and Baocai Yin",
  title =        "Multi-Level Interaction Based Knowledge Graph
                 Completion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "386--396",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "With the continuous emergence of new knowledge,
                 Knowledge Graph (KG) typically suffers from the
                 incompleteness problem, hindering the performance of
                 downstream applications. Thus, Knowledge Graph
                 Completion (KGC) has attracted considerable attention.
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qiangqiang Zhang and Dongyuan Lin and Yingying Xiao
                 and Yunfei Zheng and Shiyuan Wang",
  title =        "Error Reused Filtered-{$X$} Least Mean Square
                 Algorithm for Active Noise Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "397--412",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The conventional active noise control (ANC) system
                 relies on the error-correction learning to design the
                 adaptive controller. However, as the residual noise,
                 the correction error is discarded after each iteration
                 and is still not a perfect input to the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zengrui Jin and Mengzhe Geng and Jiajun Deng and
                 Tianzi Wang and Shujie Hu and Guinan Li and Xunying
                 Liu",
  title =        "Personalized Adversarial Data Augmentation for
                 Dysarthric and Elderly Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "413--429",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Despite the rapid progress of automatic speech
                 recognition (ASR) technologies targeting normal speech,
                 accurate recognition of dysarthric and elderly speech
                 remains a highly challenging task to date. It is
                 difficult to collect large quantities of such
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jun Kong and Jin Wang and Xuejie Zhang",
  title =        "Adaptive Ensemble Self-Distillation With Consistent
                 Gradients for Fast Inference of Pretrained Language
                 Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "430--442",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Conditional computation algorithms, e.g., the early
                 exiting (EE) strategy, can accelerate the inference of
                 pretrained language models (PLMs) by exiting shallow
                 layers without calculating the entire model. In
                 addition to the adaptive inference of EE \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sr{\dbar}an Kiti{\'c} and J{\'e}r{\^o}me Daniel",
  title =        "Blind Identification of Ambisonic Reduced Room Impulse
                 Response",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "443--458",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Qijie Shao and Pengcheng Guo and Jinghao Yan and
                 Pengfei Hu and Lei Xie",
  title =        "Decoupling and Interacting Multi-Task Learning Network
                 for Joint Speech and Accent Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "459--470",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Accents pose significant challenges for speech
                 recognition systems. Although joint automatic speech
                 recognition (ASR) and accent recognition (AR) training
                 has been proven effective in handling multi-accent
                 scenarios, current multi-task ASR-AR approaches
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Han Zhu and Gaofeng Cheng and Jindong Wang and Wenxin
                 Hou and Pengyuan Zhang and Yonghong Yan",
  title =        "Boosting Cross-Domain Speech Recognition With
                 Self-Supervision",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "471--485",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The cross-domain performance of automatic speech
                 recognition (ASR) could be severely hampered due to the
                 mismatch between training and testing distributions.
                 Since the target domain usually lacks labeled data, and
                 domain shifts exist at acoustic and \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yile Wang and Yue Zhang and Peng Li and Yang Liu",
  title =        "Gradual Syntactic Label Replacement for Language Model
                 Pre-Training",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "486--496",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Pre-training serves as a foundation of recent NLP
                 models, where language modeling tasks are performed
                 over large texts. Typical models like BERT and GPT take
                 the corpus as a whole and treat each word equally for
                 language modeling. However, recent works \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Penghui Ma and Jianfeng Li and Jingjing Pan and
                 Xiaofei Zhang and Roberto Gil-Pita",
  title =        "Coherent Signal {DOA} Estimation With Coprime Array:
                 Exploiting Signal Subspace Reconstructing Strategy",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "497--508",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Coprime array possesses a larger array aperture and
                 element spacing compared with the conventional uniform
                 linear array (ULA) for the equivalent number of
                 sensors, attracting considerable scholarly attention.
                 However, the direction of arrival (DOA) \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Emma Hamel and Nickvash Kani",
  title =        "Factors That Influence Automatic Recognition of
                 {African-American} Vernacular {English} in
                 Machine-Learning Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "509--516",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Racial bias is a well-documented problem in natural
                 language processing (NLP). The dialectal language used
                 by marginalized groups is often misclassified or
                 mischaracterized by language models, which in turn can
                 further disenfranchise these populations. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jingbei Li and Sipan Li and Ping Chen and Luwen Zhang
                 and Yi Meng and Zhiyong Wu and Helen Meng and Qiao Tian
                 and Yuping Wang and Yuxuan Wang",
  title =        "Joint Multiscale Cross-Lingual Speaking Style Transfer
                 With Bidirectional Attention Mechanism for Automatic
                 Dubbing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "517--528",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatic dubbing, which generates a corresponding
                 version of the input speech in another language, can be
                 widely utilized in many real-world scenarios, such as
                 video and game localization. In addition to
                 synthesizing the translated scripts, automatic
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Bing Han and Zhengyang Chen and Yanmin Qian",
  title =        "Self-Supervised Learning With Cluster-Aware-{DINO} for
                 High-Performance Robust Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "529--541",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The automatic speaker verification task has achieved
                 great success using deep learning approaches with a
                 large-scale, manually annotated dataset. However,
                 collecting a significant amount of well-labeled data
                 for system building is very difficult and \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kristina Tesch and Timo Gerkmann",
  title =        "Multi-Channel Speech Separation Using Spatially
                 Selective Deep Non-Linear Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "542--553",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In a multi-channel separation task with multiple
                 speakers, we aim to recover all individual speech
                 signals from the mixture. In contrast to single-channel
                 approaches, which rely on the different
                 spectro-temporal characteristics of the speech signals,
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hao-Chen Pei and Hao Fang and Xin Luo and Xin-Shun
                 Xu",
  title =        "{Gradformer}: a Framework for Multi-Aspect
                 Multi-Granularity Pronunciation Assessment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "554--563",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatic pronunciation assessment is an indispensable
                 technology in computer-assisted pronunciation training
                 systems. To further evaluate the quality of
                 pronunciation, multi-task learning with simultaneous
                 output of multi-granularity and multi-aspect has
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Garima Sharma and Karthikeyan Umapathy and Sridhar
                 Krishnan",
  title =        "Time-Frequency Scattergrams for Biomedical Audio
                 Signal Representation and Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "564--576",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech, music, and environmental sounds are the main
                 forms of audio signals that are widely studied. There
                 is a certain amount of texture present in every sound,
                 and our human auditory system is not efficient in
                 recognizing and classifying these audio \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhibo Man and Zengcheng Huang and Yujie Zhang and Yu
                 Li and Yuanmeng Chen and Yufeng Chen and Jinan Xu",
  title =        "{WDSRL}: Multi-Domain Neural Machine Translation With
                 Word-Level Domain-Sensitive Representation Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "577--590",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Due to the strong reliance on domain-specific
                 knowledge, the joint learning manner of domain
                 discrimination and translation has been widely
                 considered in the Multi-Domain Neural Machine
                 Translation (MDNMT) task. However, the word ambiguity
                 problem still \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chin-Po Chen and Ho-Hsien Pan and Susan Shur-Fen Gau
                 and Chi-Chun Lee",
  title =        "Using Measures of Vowel Space for Autistic Traits
                 Characterization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "591--607",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Autism Spectrum Disorder (ASD) is a neurodevelopmental
                 disorder that is prevalent and heterogeneous. Autistic
                 traits describe a wide heterogeneity of behavior
                 symptoms of ASD, and these traits are reflections of
                 core neurodevelopment function deficits. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Kevin Wilkinghoff and Frank Kurth",
  title =        "Why Do Angular Margin Losses Work Well for
                 Semi-Supervised Anomalous Sound Detection?",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "608--622",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "State-of-the-art anomalous sound detection systems
                 often utilize angular margin losses to learn suitable
                 representations of acoustic data using an auxiliary
                 task, which usually is a supervised or self-supervised
                 classification task. The underlying idea is \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Aku Rouhe and Tam{\'a}s Gr{\'o}sz and Mikko Kurimo",
  title =        "Principled Comparisons for End-to-End Speech
                 Recognition: Attention vs Hybrid at the $ 1000$-Hour
                 Scale",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "623--638",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "End-to-End speech recognition has become the center
                 of attention for speech recognition research, but
                 Hybrid Hidden Markov Model Deep Neural Network
                 (HMM/DNN) -systems remain a competitive approach in
                 terms of performance. End-to-End models may be better
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yile Wang and Yue Zhang",
  title =        "Lost in Context? {On} the Sense-Wise Variance of
                 Contextualized Word Embeddings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "639--650",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Contextualized word embeddings in language models have
                 given much advance to NLP. Intuitively, sentential
                 information is integrated into the representation of
                 words, which can help model polysemy. However, context
                 sensitivity also leads to the variance of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Christoph Hold and Ville Pulkki and Archontis Politis
                 and Leo McCormack",
  title =        "Compression of Higher-Order Ambisonic Signals Using
                 Directional Audio Coding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "651--665",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Delivering high-quality spatial audio in the
                 Ambisonics format requires extensive data bandwidth,
                 which may render it inaccessible for many low-bandwidth
                 applications. Existing widely-available multi-channel
                 audio compression codecs are not designed to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shouhui Wang and Biao Qin",
  title =        "A Novel Joint Training Model for Knowledge Base
                 Question Answering",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "666--679",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In knowledge base question answering (KBQA) systems,
                 relation detection and entity recognition are two core
                 components. However, since the relation detection in
                 KBQA contains thousands of relations and this task
                 always becomes a zero-shot learning task \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Songbin Li and Jingang Wang and Peng Liu and Ke Shi",
  title =        "{SANet}: A Compressed Speech Encoder and Steganography
                 Algorithm Independent Steganalysis Deep Neural
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "680--690",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Most of the existing steganalysis methods for
                 low-bit-rate compressed speech are specifically
                 designed for a particular speech encoder or category of
                 steganography methods, limiting their generalization
                 capability. These methods require pre-selection of
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tarek Kanan and Amani AbedAlghafer and Shadi AlZu'bi
                 and Bilal Hawashin and Ala Mughaid and Ghassan Kanaan
                 and M. M. Kamruzzaman",
  title =        "An Intelligent Health Care System for Detecting Drug
                 Abuse in Social Media Platforms Based on Low Resource
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "691--703",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Lately, the use of the Internet has led to an increase
                 in social networking sites. The world has become an
                 open environment, and social networking sites have been
                 increasingly used to exchange medical experiences, and
                 they have been adopted in many cases \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Alejandro Santorum Varela and Svetlana Stoyanchev and
                 Simon Keizer and Rama Doddipatla and Kate Knill",
  title =        "Entity Resolution in Situated Dialog With Unimodal and
                 Multimodal Transformers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "704--713",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this work we address the entity resolution task for
                 situated multimodal dialog investigating how a unimodal
                 approach, which uses only textual information as input
                 (representing visual attributes as text), compares to a
                 multimodal system, which \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Huang He and Hua Lu and Siqi Bao and Fan Wang and Hua
                 Wu and Zheng-Yu Niu and Haifeng Wang",
  title =        "Learning to Select External Knowledge With Multi-Scale
                 Negative Sampling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "714--720",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The Track-1 of DSTC9 aims to effectively answer user
                 requests or questions during task-oriented dialogues,
                 which are out of the scope of APIs/DB. By leveraging
                 external knowledge resources, relevant information can
                 be retrieved and encoded into the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hua Lu and Zhen Guo and Chanjuan Li and Yunyi Yang and
                 Huang He and Siqi Bao",
  title =        "Towards Building an Open-Domain Dialogue System
                 Incorporated With {Internet} Memes",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "721--726",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In recent years, Internet memes have been widely used
                 in online chatting. Compared with text-based
                 communication, conversations become more expressive and
                 attractive when Internet memes are incorporated. This
                 article presents our solutions for the Meme \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jungwoo Lim and Taesun Whang and Dongyub Lee and
                 Heuiseok Lim",
  title =        "Adaptive Multi-Domain Dialogue State Tracking on
                 Spoken Conversations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "727--732",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The main objective of the task-oriented dialogue
                 system is to identify the intent and needs of human
                 dialogue. Many existing studies are conducted under the
                 setting of written dialogue, but there always exists a
                 difficulty in coping with real-world spoken \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "David Thulke and Nico Daheim and Christian Dugast and
                 Hermann Ney",
  title =        "Task-Oriented Document-Grounded Dialog Systems by
                 {HLTPR@RWTH} for {DSTC9} and {DSTC10}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "733--741",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper summarizes our contributions to the
                 document-grounded dialog tasks at the 9th and 10th
                 Dialog System Technology Challenges (DSTC9 and DSTC10).
                 In both iterations the task consists of three subtasks:
                 first detect whether the current turn is \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Han Wu and Kun Xu and Linqi Song",
  title =        "Structure-Aware Dialogue Modeling Methods for
                 Conversational Semantic Role Labeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "742--752",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Conversational semantic role labeling (CSRL) is
                 believed to be a crucial step toward dialogue
                 understanding. By incorporating the CSRL information
                 into the conversational models, previous work (Xu et
                 al., 2021) has confirmed the usefulness of CSRL to
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhe Chen and Hongcheng Liu and Yu Wang",
  title =        "{DialogMCF}: Multimodal Context Flow for Audio Visual
                 Scene-Aware Dialog",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "753--764",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In recent years, Audio Visual Scene-Aware Dialog
                 (AVSD) has been an active research task in the
                 multimodal dialogue community and has also been a core
                 part of the Dialog System Technology Challenge (DSTC).
                 This task is an extension of conventional visual
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Koichiro Yoshino and Yun-Nung Chen and Paul Crook and
                 Satwik Kottur and Jinchao Li and Behnam Hedayatnia and
                 Seungwhan Moon and Zhengcong Fei and Zekang Li and
                 Jinchao Zhang and Yang Feng and Jie Zhou and Seokhwan
                 Kim and Yang Liu and Di Jin and Alexandros Papangelis
                 and Karthik Gopalakrishnan and Dilek Hakkani-Tur and
                 Babak Damavandi and Alborz Geramifard and Chiori Hori
                 and Ankit Shah and Chen Zhang and Haizhou Li and
                 Jo{\~a}o Sedoc and Luis F. D'Haro and Rafael Banchs and
                 Alexander Rudnicky",
  title =        "Overview of the Tenth Dialog System Technology
                 Challenge: {DSTC10}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "765--778",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This article introduces the Tenth Dialog System
                 Technology Challenge (DSTC-10). This edition of the
                 DSTC focuses on applying end-to-end dialog technologies
                 for five distinct tasks in dialog systems, namely 1.
                 Incorporation of Meme images into open domain
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shekhar Kumar Yadav and Nithin V. George",
  title =        "Joint Dereverberation and Beamforming With Blind
                 Estimation of the Shape Parameter of the Desired Source
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "779--793",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Dereverberation and acoustic beamforming is used to
                 capture the speech of a desired speaker in the presence
                 of interfering speakers in a reverberant room using an
                 array of microphones. Traditionally, to perform these
                 two tasks, the desired speech is \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yanxiong Li and Zhongjie Jiang and Qisheng Huang and
                 Wenchang Cao and Jialong Li",
  title =        "Lightweight Speaker Verification Using Transformation
                 Module With Feature Partition and Fusion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "794--806",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Although many efforts have been made on decreasing the
                 model complexity for speaker verification, it is still
                 challenging to deploy speaker verification systems with
                 satisfactory result on low-resource terminals. We
                 design a transformation module that \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuhan Dai and Zhirui Zhang and Yichao Du and Shengcai
                 Liu and Lemao Liu and Tong Xu",
  title =        "Datastore Distillation for Nearest Neighbor Machine
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "807--817",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Changtao Li and Feiran Yang and Jun Yang",
  title =        "A Two-Stage Approach to Quality Restoration of
                 Bone-Conducted Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "818--829",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Bone-conducted speech is not susceptible to
                 background noise but suffers from poor speech quality
                 and intelligibility due to the limited bandwidth. This
                 paper proposes a two-stage approach to restore the
                 quality of bone-conducted speech, namely, bandwidth
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jie Zhou and Yuanbiao Lin and Qin Chen and Qi Zhang
                 and Xuanjing Huang and Liang He",
  title =        "{CausalABSC}: Causal Inference for Aspect Debiasing in
                 Aspect-Based Sentiment Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "830--840",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "As the primary subtask of sentiment analysis,
                 aspect-based sentiment classification (ABSC) aims to
                 predict the sentiment polarity for a given aspect.
                 While recent deep neural models for ABSC have shown
                 good performance, their robustness is limited due to
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ruiying Lu and Bo Chen and Dandan Guo and Dongsheng
                 Wang and Mingyuan Zhou",
  title =        "Hierarchical Topic-Aware Contextualized Transformers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "841--852",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Training on disjoint fixed-length segments,
                 Transformers convert static word embeddings into
                 contextualized word representations. However, they
                 often restrict the context of a token to the segment it
                 resides in and hence neglect the contextual information
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yaru Zhao and Bo Cheng and Yakun Huang and Zhiguo
  title =        "{FluGCF}: A Fluent Dialogue Generation Model With
                 Coherent Concept Entity Flow",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "853--867",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The integration of external knowledge graphs into
                 dialogue systems effectively mitigates the generation
                 of generic and uninteresting responses. This approach,
                 particularly the explicit modeling of conversation
                 flows from related concept entities, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Changhao Ding and Zhangjie Fu and Zhongliang Yang and
                 Qi Yu and Daqiu Li and Yongfeng Huang",
  title =        "Context-Aware Linguistic Steganography Model Based on
                 Neural Machine Translation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "868--878",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Linguistic steganography based on text generation is a
                 hot topic in the field of text information hiding.
                 Previous studies have managed to improve the syntactic
                 quality of steganography texts using natural language
                 processing techniques based on deep \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zainab Alhakeem and Se-In Jang and Hong-Goo Kang",
  title =        "Disentangled Representations in Local-Global Contexts
                 for {Arabic} Dialect Identification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "879--890",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this article, we propose a locally and globally
                 informed disentanglement network for Arabic dialect
                 identification (ADI). Our proposed disentanglement
                 network aims to detach all irrelevant information
                 (e.g., speaker, gender and channel) from the source
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jae-Hong Lee and Joon-Hyuk Chang",
  title =        "Partitioning Attention Weight: Mitigating Adverse
                 Effect of Incorrect Pseudo-Labels for Self-Supervised
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "891--905",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The performance of automatic speech recognition (ASR)
                 models has been significantly improved owing to
                 advances in deep learning and end-to-end approaches.
                 However, these require a large amount of labeled data,
                 which are expensive to obtain. Semi- \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ryo Fukuda and Katsuhito Sudoh and Satoshi Nakamura",
  title =        "Improving Speech Translation Accuracy and Time
                 Efficiency With Fine-Tuned wav2vec 2.0-Based Speech
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "906--916",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech translation (ST) automatically converts
                 utterances in a source language into text in another
                 language. Splitting continuous speech into shorter
                 segments, known as speech segmentation, plays an
                 important role in ST. Recent segmentation methods
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Seong-Gyun Leem and Daniel Fulford and Jukka-Pekka
                 Onnela and David Gard and Carlos Busso",
  title =        "Selective Acoustic Feature Enhancement for Speech
                 Emotion Recognition With Noisy Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "917--929",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Alexander Bohlender and Ann Spriet and Wouter Tirry
                 and Nilesh Madhu",
  title =        "Spatially Selective Speaker Separation Using a {DNN}
                 With a Location Dependent Feature Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "930--945",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Deep neural networks (DNNs) have proven themselves as
                 an effective means to separate clean speech from noisy
                 mixtures. When there are multiple concurrent talkers,
                 however, unambiguously defining the target output is
                 not trivial, especially if the mixture \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Matan Karo and Arie Yeredor and Itshak Lapidot",
  title =        "Compact Time-Domain Representation for Logical Access
                 Spoofed Audio",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "946--958",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Anti-spoofing is the task of speech authentication.
                 That is, identifying genuine human speech compared to
                 spoofed speech. The main focus of this paper is to
                 suggest new representations for genuine and spoofed
                 speech, based on the probability mass function
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Or Berebi and Zamir Ben-Hur and David Lou Alon and
                 Boaz Rafaely",
  title =        "Analysis and Design of Head-Tracked Compensation for
                 Bilateral Ambisonics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "959--972",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Virtual and augmented reality technologies demand
                 high-quality spatial sound recording and playback
                 through headphones. However, achieving high-quality
                 binaural reproduction requires a complex recording
                 system and a large number of microphones. To address
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wei Wang and Yanmin Qian",
  title =        "Universal Cross-Lingual Data Generation for Low
                 Resource {ASR}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "973--983",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Significant advances in end-to-end (E2E) automatic
                 speech recognition (ASR) have primarily been
                 concentrated on languages rich in annotated data.
                 Nevertheless, a large proportion of languages
                 worldwide, which are typically low-resource, continue
                 to pose \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Davide Berghi and Philip J. B. Jackson",
  title =        "Leveraging Visual Supervision for Array-Based Active
                 Speaker Detection and Localization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "984--995",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Conventional audio-visual approaches for active
                 speaker detection (ASD) typically rely on visually
                 pre-extracted face tracks and the corresponding
                 single-channel audio to find the speaker in a video.
                 Therefore, they tend to fail every time the face of the
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Daniel Aleksander Krause and Guillermo
                 Garc{\'\i}a-Barrios and Archontis Politis and Annamaria
  title =        "Binaural Sound Source Distance Estimation and
                 Localization for a Moving Listener",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "996--1011",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we investigate the tasks of binaural
                 source distance estimation (SDE) and
                 direction-of-arrival estimation (DOAE) using
                 motion-based cues in a scenario with a walking
                 listener. On top of performing both tasks as separate
                 problems, we study \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Seung-Bin Kim and Sang-Hoon Lee and Ha-Yeong Choi and
                 Seong-Whan Lee",
  title =        "Audio Super-Resolution With Robust Speech
                 Representation Learning of Masked Autoencoder",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1012--1022",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper proposes Fre-Painter, a high-fidelity audio
                 super-resolution system that utilizes robust speech
                 representation learning with various masking
                 strategies. Recently, masked autoencoders have been
                 found to be beneficial in learning robust \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Omer Musa Battal and Aykut Ko{\c{c}}",
  title =        "Automatic Construction of Sememe Knowledge Bases From
                 Machine Readable Dictionaries",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1023--1035",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Sememes are the minimum semantic units of natural
                 languages. Words annotated with sememes are organized
                 into Sememe Knowledge Bases (SKBs). SKBs are
                 successfully applied to various high-level language
                 processing tasks as external knowledge bases. However,
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Varun Krishna and Tarun Sai and Sriram Ganapathy",
  title =        "Representation Learning With Hidden Unit Clustering
                 for Low Resource Speech Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1036--1047",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we describe an approach to
                 self-supervised representation learning from raw audio
                 using a hidden unit clustering (HUC) framework. The
                 input to the model consists of audio samples that are
                 windowed and processed with 1-D convolutional
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhengding Luo and Dongyuan Shi and Woon-Seng Gan and
                 Qirui Huang",
  title =        "Delayless Generative Fixed-Filter Active Noise Control
                 Based on Deep Learning and {Bayesian} Filter",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1048--1060",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The selective fixed-filter active noise control
                 (SFANC) method can select suitable pre-trained control
                 filters to attenuate incoming noises. However, the
                 limited number of pre-trained filters is insufficient
                 to effectively control various forms of noise,
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zewen Chi and Heyan Huang and Luyang Liu and Yu Bai
                 and Xiaoyan Gao and Xian-Ling Mao",
  title =        "Can Pretrained {English} Language Models Benefit
                 Non-{English} {NLP} Systems in Low-Resource
                 Scenarios?",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1061--1074",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Pretrained language models have achieved great success
                 in a wide range of natural language processing (NLP)
                 problems, because they learn language representations
                 from large-scale text corpora and can adapt to
                 downstream tasks by finetuning them on \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rui Liu and Yifan Hu and Haolin Zuo and Zhaojie Luo
                 and Longbiao Wang and Guanglai Gao",
  title =        "Text-to-Speech for Low-Resource Agglutinative Language
                 With Morphology-Aware Language Model Pre-Training",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1075--1087",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Text-to-Speech (TTS) aims to convert the input text
                 to a human-like voice. With the development of deep
                 learning, encoder-decoder based TTS models perform
                 superior performance, in terms of naturalness, in
                 mainstream languages such as Chinese, English,
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shu Jiang and Zuchao Li and Hai Zhao and Weiping
                 Ding",
  title =        "Entity-Relation Extraction as Full Shallow Semantic
                 Dependency Parsing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1088--1099",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Entity-relation extraction is the essential
                 information extraction task and can be decomposed into
                 Named Entity Recognition (NER) and Relation Extraction
                 (RE) subtasks. This paper proposes a novel joint
                 entity-relation extraction method that models the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yoav Vered and Stephen Elliott",
  title =        "A Parallel Analog and Digital Adaptive Feedforward
                 Controller for Active Noise Control",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1100--1108",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Digital adaptive controllers are widely used for
                 feedforward active noise control, especially in
                 headphones. In such applications, the secondary path
                 delay, including the sampling and reconstruction
                 effects, must be shorter than the primary path delay to
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Puning Zhang and Rongjian Zhao and Boran Yang and
                 Yuexian Li and Zhigang Yang",
  title =        "Integrated Syntactic and Semantic Tree for Targeted
                 Sentiment Classification Using Dual-Channel Graph
                 Convolutional Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1109--1124",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Targeted sentiment analysis aims to identify the
                 sentiment polarity of specific target mentions in a
                 sentence. Existing methods employ neural networks to
                 extract the relations between target mentions and their
                 contexts. Recent approaches based on graph \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xu Wang and Hainan Zhang and Shuai Zhao and Hongshen
                 Chen and Zhuoye Ding and Zhiguo Wan and Bo Cheng and
                 Yanyan Lan",
  title =        "Debiasing Counterfactual Context With Causal Inference
                 for Multi-Turn Dialogue Reasoning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1125--1132",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In the multi-turn dialogue reasoning task, existing
                 models conduct word-level interaction on the entire
                 context to gather reasoning evidence, which aims to
                 select the logically correct one from the candidate
                 response options. Observing the fact that the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Hoang Ngoc Chau and Tien Dat Bui and Huu Binh Nguyen
                 and Thanh Thi Hien Duong and Quoc Cuong Nguyen",
  title =        "A Novel Approach to Multi-Channel Speech Enhancement
                 Based on Graph Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1133--1144",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Multi-channel speech enhancement aims at utilizing
                 spatial relationships between signals captured from a
                 microphone array along with temporal-spectral
                 information efficiently to estimate the clean target.
                 An emerging approach is to design deep learning-based
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuchen Hu and Chen Chen and Qiushi Zhu and Eng Siong
                 Chng",
  title =        "{Wav2code}: Restore Clean Speech Representations via
                 Codebook Lookup for Noise-Robust {ASR}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1145--1156",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatic speech recognition (ASR) has gained
                 remarkable successes thanks to recent advances of deep
                 learning, but it usually degrades significantly under
                 real-world noisy conditions. Recent works introduce
                 speech enhancement (SE) as front-end to improve
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tetsuya Ueda and Tomohiro Nakatani and Rintaro
                 Ikeshita and Keisuke Kinoshita and Shoko Araki and
                 Shoji Makino",
  title =        "Blind and Spatially-Regularized Online Joint
                 Optimization of Source Separation, Dereverberation, and
                 Noise Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1157--1172",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper proposes a computationally efficient joint
                 optimization algorithm that performs online source
                 separation, dereverberation, and noise reduction based
                 on blind and spatially-regularized processing. When
                 applying such online Blind Source \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Vibhav Agarwal and Sourav Ghosh and Harichandana BSS
                 and Himanshu Arora and Barath Raj Kandur Raja",
  title =        "{TrICy}: Trigger-Guided Data-to-Text Generation With
                 Intent Aware Attention-Copy",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1173--1184",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Data-to-text (D2T) generation is a crucial task in
                 many natural language understanding (NLU) applications
                 and forms the foundation of task-oriented dialog
                 systems. In the context of conversational AI solutions
                 that can work directly with local data on the
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Christoph Boeddeker and Aswin Shanmugam Subramanian
                 and Gordon Wichern and Reinhold Haeb-Umbach and
                 Jonathan {Le Roux}",
  title =        "{TS-SEP}: Joint Diarization and Separation Conditioned
                 on Estimated Speaker Embeddings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1185--1197",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Since diarization and source separation of meeting
                 data are closely related tasks, we here propose an
                 approach to perform the two objectives jointly. It
                 builds upon the target-speaker voice activity detection
                 (TS-VAD) diarization approach, which assumes \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Reza Varzandeh and Simon Doclo and Volker Hohmann",
  title =        "Speech-Aware Binaural {DOA} Estimation Utilizing
                 Periodicity and Spatial Features in Convolutional
                 Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1198--1213",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In recent years, several supervised learning-based
                 approaches have been proposed for estimating the
                 direction of arrival (DOA) of a single talker in noisy
                 and reverberant environments. In the absence of
                 auxiliary information, such as a voice activity
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yigitcan {\"O}zer and Meinard M{\"u}ller",
  title =        "Source Separation of Piano Concertos Using Musically
                 Motivated Augmentation Techniques",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1214--1225",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this work, we address the novel and rarely
                 considered source separation task of decomposing piano
                 concerto recordings into separate piano and orchestral
                 tracks. Being a genre written for a pianist typically
                 accompanied by an ensemble or orchestra, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lior Frenkel and Shlomo E. Chazan and Jacob
                 Goldberger",
  title =        "Domain Adaptation Using Suitable Pseudo Labels for
                 Speech Enhancement and Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1226--1236",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech enhancement and dereverberation approaches
                 based on neural networks are designed to learn a
                 transformation from noisy to clean speech using
                 supervised learning. However, networks trained in this
                 way may fail to effectively handle languages, types
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiahao Zhao and Wenji Mao and Daniel Dajun Zeng",
  title =        "Disentangled Text Representation Learning With
                 Information-Theoretic Perspective for Adversarial
                 Robustness",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1237--1247",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Adversarial vulnerability remains a major obstacle to
                 the construction of reliable NLP systems. When
                 imperceptible perturbations are added to raw input
                 text, the performance of a deep learning model may drop
                 dramatically under attacks. Recent work has \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Dong Zhou and Fang Lei and Lin Li and Yongmei Zhou and
                 Aimin Yang",
  title =        "Cross-Modal Interaction via Reinforcement Feedback for
                 Audio-Lyrics Retrieval",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1248--1260",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The task of retrieving audio content relevant to lyric
                 queries and vice versa plays a critical role in
                 music-oriented applications. In this process, robust
                 feature representations have to be learned for two
                 modalities. Furthermore, interactions between
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xuechen Liu and Md Sahidullah and Kong Aik Lee and
                 Tomi Kinnunen",
  title =        "Generalizing Speaker Verification for Spoof Awareness
                 in the Embedding Space",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1261--1273",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Shiyao Cui and Jiangxia Cao and Xin Cong and Jiawei
                 Sheng and Quangang Li and Tingwen Liu and Jinqiao Shi",
  title =        "Enhancing Multimodal Entity and Relation Extraction
                 With Variational Information Bottleneck",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1274--1285",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This article studies the multimodal named entity
                 recognition (MNER) and multimodal relation extraction
                 (MRE), which are important for content analysis and
                 various applications. The core of MNER and MRE lies in
                 incorporating evident visual information to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yizhou Tan and Haojun Ai and Shengchen Li and Mark D.
                 Plumbley",
  title =        "Acoustic Scene Classification Across Cities and
                 Devices via Feature Disentanglement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1286--1297",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Acoustic Scene Classification (ASC) is a task that
                 classifies a scene according to environmental acoustic
                 signals. Audios collected from different cities and
                 devices often exhibit biases in feature distributions,
                 which may negatively impact ASC \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Orel {Ben Zaken} and Anurag Kumar and Vladimir
                 Tourbabin and Boaz Rafaely",
  title =        "Neural-Network-Based Direction-of-Arrival Estimation
                 for Reverberant Speech --- The Importance of Energetic,
                 Temporal, and Spatial Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1298--1309",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Direction-of-arrival (DOA) estimation is a
                 fundamental task in audio signal processing that
                 becomes difficult in real-world environments due to the
                 presence of reverberation. To address this difficulty,
                 Direct-Path Dominance (DPD) tests have been proposed
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Changsheng Quan and Xiaofei Li",
  title =        "{SpatialNet}: Extensively Learning Spatial Information
                 for Multichannel Joint Speech Separation, Denoising and
                 Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1310--1323",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This work proposes a neural network to extensively
                 exploit spatial information for multichannel joint
                 speech separation, denoising and dereverberation, named
                 SpatialNet. In the short-time Fourier transform (STFT)
                 domain, the proposed network performs end-to-end
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Matthew Baas and Herman Kamper",
  title =        "Disentanglement in a {GAN} for Unconditional Speech
                 Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1324--1335",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Can we develop a model that can synthesize realistic
                 speech directly from a latent space, without explicit
                 conditioning? Despite several efforts over the last
                 decade, previous adversarial and diffusion-based
                 approaches still struggle to achieve this, even
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xian Li and Nian Shao and Xiaofei Li",
  title =        "Self-Supervised Audio Teacher-Student Transformer for
                 Both Clip-Level and Frame-Level Tasks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1336--1351",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Self-supervised learning (SSL) has emerged as a
                 popular approach for learning audio representations.
                 One goal of audio self-supervised pre-training is to
                 transfer knowledge to downstream audio tasks, generally
                 including clip-level and frame-level tasks. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yifan Chen and Gaofeng Cheng and Runyan Yang and
                 Pengyuan Zhang and Yonghong Yan",
  title =        "Interrelate Training and Clustering for Online Speaker
                 Diarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1352--1364",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In clustering-based speaker diarization systems, the
                 embedding clusters for distinctive speakers exhibit
                 wide variability in size and density, posing difficulty
                 for clustering accuracy. In spite of this, with the
                 assistance of the overall distance \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Sheng Feng and Xiaoqian Zhu and Shuqing Ma",
  title =        "Masking Hierarchical Tokens for Underwater Acoustic
                 Target Recognition With Self-Supervised Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1365--1379",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Deep learning has made data-driven methods effective
                 in underwater acoustic target recognition (UATR) using
                 passive sonar signals. However, a major current
                 challenge is the limited availability of underwater
                 acoustic data, leading to suboptimal \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yangyang Zhao and Kai Yin and Zhenyu Wang and Mehdi
                 Dastani and Shihan Wang",
  title =        "Decomposed Deep {$Q$}-Network for Coherent
                 Task-Oriented Dialogue Policy Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1380--1391",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Reinforcement learning (RL) has emerged as a key
                 technique for designing dialogue policies. However,
                 action space inflation in dialogue tasks has led to a
                 heavy decision burden and incoherence problems for
                 dialogue policies. In this paper, we propose a
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jayneel Parekh and Sanjeel Parekh and Pavlo
                 Mozharovskyi and Ga{\"e}l Richard and Florence
                 d'Alch{\'e}-Buc",
  title =        "Tackling Interpretability in Audio Classification
                 Networks With Non-negative Matrix Factorization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1392--1405",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiuying Chen and Shen Gao and Mingzhe Li and Qingqing
                 Zhu and Xin Gao and Xiangliang Zhang",
  title =        "Write Summary Step-by-Step: a Pilot Study of Stepwise
                 Summarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1406--1415",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Nowadays, neural text generation has made tremendous
                 progress in abstractive summarization tasks. However,
                 most of the existing summarization models take in the
                 whole document all at once, which sometimes cannot meet
                 the needs in practice. Practically, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Changkai Lin and Hongju Cheng and Qiang Rao and Yang
                 Yang",
  title =        "{M$^3$SA}: Multimodal Sentiment Analysis Based on
                 Multi-Scale Feature Extraction and Multi-Task
                 Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1416--1429",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Sentiment analysis plays an indispensable part in
                 human-computer interaction. Multimodal sentiment
                 analysis can overcome the shortcomings of unimodal
                 sentiment analysis by fusing multimodal data. However,
                 how to extract improved feature representations
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Rui-Chen Zheng and Yang Ai and Zhen-Hua Ling",
  title =        "Incorporating Ultrasound Tongue Images for
                 Audio-Visual Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1430--1444",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Audio-visual speech enhancement (AV-SE) aims to
                 enhance degraded speech along with extra visual
                 information such as lip videos, and has been shown to
                 be more effective than audio-only speech enhancement.
                 This paper proposes the incorporation of ultrasound
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Ritujoy Biswas and Karan Nathwani and Vinayak Abrol",
  title =        "Statistically Guided Near-End Speech Intelligibility
                 Improvement Through Voice Transformation and Transfer
                 Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1445--1456",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In recent developments, speech intelligibility has
                 been improved through an optimal trapezoidal
                 transformation function, which performed normal to
                 Lombard speech conversion via formant shifting. Despite
                 performing well, the optimization took very long to
                 \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Linhui Sun and Shuo Yuan and Aifei Gong and Lei Ye and
                 Eng Siong Chng",
  title =        "Dual-Branch Modeling Based on State-Space Model for
                 Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1457--1467",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Traditional time-frequency domain speech enhancement
                 methods either only enhance the amplitude spectral
                 features without changing the phase that contributes to
                 the naturalness, intelligibility and harmonic
                 structure, or improve the estimation of the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Alkis Koudounas and Eliana Pastor and Giuseppe
                 Attanasio and Vittorio Mazzia and Manuel Giollo and
                 Thomas Gueudre and Elisa Reale and Luca Cagliero and
                 Sandro Cumani and Luca de Alfaro and Elena Baralis and
                 Daniele Amberti",
  title =        "Towards Comprehensive Subgroup Performance Analysis in
                 Speech Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1468--1480",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The evaluation of spoken language understanding (SLU)
                 systems is often restricted to assessing their global
                 performance or examining predefined subgroups of
                 interest. However, a more detailed analysis at the
                 subgroup level has the potential to uncover \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Wenmeng Xiong and Changchun Bao and Jing Zhou and
                 Maoshen Jia and Jos{\'e} Picheral",
  title =        "Joint {DOA} Estimation and Dereverberation Based on
                 Multi-Channel Linear Prediction Filtering and Azimuth
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1481--1493",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Source localization in reverberant environments has
                 been a prominent research topic in the past two
                 decades. In this paper, instead of the commonly
                 employed time-frequency (TF) bin based methods which
                 rely on empirically selected threshold values, we
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yehav Alkaher and Israel Cohen",
  title =        "Howling Detection and Gain Control for Speech
                 Reinforcement in a Noisy Car Cabin Environment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1494--1505",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In-car speech communication is particularly
                 challenging due to environmental noise. The speaker's
                 microphone also acquires car and road noises, resulting
                 in a low signal-to-noise ratio and persistent
                 frequency-howls that do not decrease, which \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xinfa Zhu and Yi Lei and Tao Li and Yongmao Zhang and
                 Hongbin Zhou and Heng Lu and Lei Xie",
  title =        "{METTS}: Multilingual Emotional Text-to-Speech by
                 Cross-Speaker and Cross-Lingual Emotion Transfer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1506--1518",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Previous multilingual text-to-speech (TTS) approaches
                 have considered leveraging monolingual speaker data to
                 enable cross-lingual speech synthesis. However, such
                 data-efficient approaches have ignored synthesizing
                 emotional aspects of speech due to the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Myeonghun Jeong and Minchan Kim and Byoung Jin Choi
                 and Jaesam Yoon and Won Jang and Nam Soo Kim",
  title =        "Transfer Learning for Low-Resource, Multi-Lingual, and
                 Zero-Shot Multi-Speaker Text-to-Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1519--1530",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Jiadi Yao and Hong Luo and Jun Qi and Xiao-Lei Zhang",
  title =        "Interpretable Spectrum Transformation Attacks to
                 Speaker Recognition Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1531--1545",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiang Chen and Lei Li and Yuqi Zhu and Shumin Deng and
                 Chuanqi Tan and Fei Huang and Luo Si and Ningyu Zhang
                 and Huajun Chen",
  title =        "Sequence Labeling as Non-Autoregressive Dual-Query Set
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1546--1558",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Sequence labeling is a crucial task in the NLP
                 community that aims at identifying and assigning spans
                 within the input sentence. It has wide applications in
                 various fields such as information extraction, dialogue
                 system, and sentiment analysis. However, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lei Liu and Li Liu and Haizhou Li",
  title =        "Computation and Parameter Efficient Multi-Modal Fusion
                 Transformer for Cued Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1559--1572",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Cued Speech (CS) is a pure visual coding method used
                 by hearing-impaired people that combines lip reading
                 with several specific hand shapes to make the spoken
                 language visible. Automatic CS recognition (ACSR) seeks
                 to transcribe visual cues of speech into \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Adri{\'a}n Barahona-R{\'\i}os and Tom Collins",
  title =        "{NoiseBandNet}: Controllable Time-Varying Neural
                 Synthesis of Sound Effects Using Filterbanks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1573--1585",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Controllable neural audio synthesis of sound effects
                 is a challenging task due to the potential scarcity and
                 spectro-temporal variance of the data. Differentiable
                 digital signal processing (DDSP) synthesisers have been
                 successfully employed to model and \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Siyuan Wang and Zhongyu Wei and Jiarong Xu and Taishan
                 Li and Zhihao Fan",
  title =        "Unifying Structure Reasoning and Language Pre-Training
                 for Complex Reasoning Tasks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1586--1595",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Recent pre-trained language models (PLMs) equipped
                 with foundation reasoning skills have shown remarkable
                 performance on downstream complex tasks. However, the
                 significant structure reasoning skill has been rarely
                 studied, which involves modeling implicit \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yijing Chu and Sipei Zhao and Feng Niu and Yongzheng
                 Dong and Yuezhe Zhao",
  title =        "A New Diffusion Filtered-{$X$} Affine Projection
                 Algorithm: Performance Analysis and Application in
                 Windy Environment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1596--1608",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Wind noise caused by turbulent flows over microphones
                 usually has detrimental impacts on the reference signal
                 of an active noise control (ANC) system and degrade its
                 performance considerably. This paper evaluates the
                 influence of wind noise on the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yuquan Le and Zhe Quan and Jiawei Wang and Da Cao and
                 Kenli Li",
  title =        "{$ R^2 $}: a Novel Recall \& Ranking Framework for
                 Legal Judgment Prediction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1609--1622",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "The legal judgment prediction (LJP) task is to
                 automatically decide appropriate law articles, charges,
                 and term of penalty for giving the fact description of
                 a law case. It considerably influences many real legal
                 applications and has thus attracted the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xiaotong Jiang and Ruirui Bai and Zhongqing Wang and
                 Guodong Zhou",
  title =        "Cross-Domain Aspect-Based Sentiment Classification
                 With Tripartite Graph Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1623--1635",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Previous studies on cross-domain aspect-based
                 sentiment classification depend on the pivot features
                 or utilize the target data for representation learning,
                 which ignores the correlations between instances and
                 words. In this study, we employ two strategies
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhengyang Chen and Bing Han and Shuai Wang and Yanmin
  title =        "Attention-Based Encoder-Decoder End-to-End Neural
                 Diarization With Embedding Enhancer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1636--1649",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Deep neural network-based systems have significantly
                 improved the performance of speaker diarization tasks.
                 However, end-to-end neural diarization (EEND) systems
                 often struggle to generalize to scenarios with an
                 unseen number of speakers, while target \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Chenfeng Miao and Qingying Zhu and Minchuan Chen and
                 Jun Ma and Shaojun Wang and Jing Xiao",
  title =        "{EfficientTTS 2}: Variational End-to-End
                 Text-to-Speech Synthesis and Voice Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1650--1661",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Recently, the field of Text-to-Speech (TTS) has been
                 dominated by one-stage text-to-waveform models which
                 have significantly improved speech quality compared to
                 two-stage models. In this work, we propose EfficientTTS
                 2 (EFTS2), a one-stage high-quality \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Orel Peretz and Israel Cohen",
  title =        "Constant Elevation-Beamwidth Beamforming With
                 Concentric Ring Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1662--1672",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "A hybrid approach is proposed to efficiently design a
                 constant elevation-beamwidth beamforming with
                 concentric ring arrays (CRAs). The design exploits the
                 degrees of freedom of the array geometry for superior
                 performance. In particular, the ring radii and
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Zhibin Quan and Chi-Man Vong and Weili Zeng and Wankou
  title =        "The {MorPhEMe} Machine: an Addressable Neural Memory
                 for Learning Knowledge-Regularized Deep Contextualized
                 {Chinese} Embedding",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1673--1686",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Deep contextualized embeddings, as learned by large
                 pre-training models, have proven highly effective in
                 various downstream natural language processing tasks.
                 However, the embedding space in these large models
                 lacks explicit regularization, leading to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Lijian Gao and Qirong Mao and Ming Dong",
  title =        "On Local Temporal Embedding for Semi-Supervised Sound
                 Event Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1687--1698",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Semi-supervised sound event detection (SSED) task
                 requires recognizing the categories of events and
                 marking each event's onset and offset times in a mixed
                 audio recording using a small amount of weakly labeled
                 and a large scale of unlabeled data. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xuehao Zhou and Mingyang Zhang and Yi Zhou and
                 Zhizheng Wu and Haizhou Li",
  title =        "Accented Text-to-Speech Synthesis With Limited Data",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1699--1711",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This paper presents an accented text-to-speech (TTS)
                 synthesis framework with limited training data. We
                 study two aspects concerning accent rendering: phonetic
                 (phoneme difference) and prosodic (pitch pattern and
                 phoneme duration) variations. The proposed \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Vinay Kothapally and John H. L. Hansen",
  title =        "Monaural Speech Dereverberation Using Deformable
                 Convolutional Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1712--1723",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Reverberation and background noise can degrade speech
                 quality and intelligibility when captured by a distant
                 microphone. In recent years, researchers have developed
                 several deep learning (DL)-based single-channel speech
                 dereverberation systems that aim to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Taihui Wang and Feiran Yang and Jun Yang",
  title =        "Multichannel Linear Prediction-Based Speech
                 Dereverberation Considering Sparse and Low-Rank
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1724--1735",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "This article addresses the multi-channel linear
                 prediction (MCLP)-based speech dereverberation problem
                 by jointly considering the sparsity and low-rank priors
                 of speech spectrograms. We utilize the complex
                 generalized Gaussian (CGG) distribution as the
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Saurabh Kataria and Jes{\'u}s Villalba and Laureano
                 Moro-Vel{\'a}zquez and Piotr {\.Z}elasko and Najim
  title =        "Time-Domain Speech Super-Resolution With {GAN} Based
                 Modeling for Telephony Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1736--1749",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Automatic Speaker Verification (ASV) technology has
                 become commonplace in virtual assistants. However, its
                 performance suffers when there is a mismatch between
                 the train and test domains. Mixed bandwidth training,
                 i.e., pooling training data from both \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Marco Olivieri and Amy Bastine and Mirco Pezzoli and
                 Fabio Antonacci and Thushara Abhayapala and Augusto
  title =        "Acoustic Imaging With Circular Microphone Array: a New
                 Approach for Sound Field Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1750--1761",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Acoustic imaging is powerful in collecting spatial
                 information of acoustic sources into a visual
                 representation. In this paper, we focus on the analysis
                 of the exterior acoustic field captured by a circular
                 array of microphones. With a proper \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Tengfei Liu and Yongli Hu and Junbin Gao and Yanfeng
                 Sun and Baocai Yin",
  title =        "Hierarchical Multi-Granularity Interaction Graph
                 Convolutional Network for Long Document
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1762--1775",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "With the growing demand for text analytics, long
                 document classification (LDC) has received extensive
                 attention, and great progress has been made. To reveal
                 the complex structure and extract the intrinsic
                 feature, the current approaches focus on modeling
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Douglas O'Shaughnessy",
  title =        "Review of Methods for Automatic Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1776--1789",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "A review of techniques to identify speakers from their
                 voices is presented, noting strengths and weaknesses of
                 various methods. Similar acoustic analysis has been
                 often used for both speech and speaker recognition,
                 despite the two tasks being quite \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Etienne Thuillier and Craig T. Jin and Vesa
  title =        "{HRTF} Interpolation Using a Spherical Neural Process
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1790--1802",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Several individualization methods have recently been
                 proposed to estimate a subject's Head-Related Transfer
                 Function (HRTF) using convenient input modalities such
                 as anthropometric measurements or pinnae photographs.
                 There exists a need for \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Xun Gong and Yu Wu and Jinyu Li and Shujie Liu and Rui
                 Zhao and Xie Chen and Yanmin Qian",
  title =        "Advanced Long-Content Speech Recognition With
                 Factorized Neural Transducer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1803--1815",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Long-content automatic speech recognition (ASR) has
                 obtained increasing interest in recent years, as it
                 captures the relationship among consecutive historical
                 utterances while decoding the current utterance. In
                 this paper, we propose two novel approaches, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yoshiki Masuyama and Kouei Yamaoka and Takao Kawamura
                 and Nobutaka Ono",
  title =        "Efficient Joint Optimization of Sampling Rate Offsets
                 Using Entire Multichannel Signal",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1816--1828",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "In this paper, we propose a joint estimation method
                 for the sampling rate offsets (SROs) of multiple
                 recording devices. In wireless acoustic sensor
                 networks, distributed microphones are connected to
                 different analog-to-digital converters, and thus SROs
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Takaaki Saeki and Soumi Maiti and Xinjian Li and
                 Shinji Watanabe and Shinnosuke Takamichi and Hiroshi
  title =        "Text-Inductive Graphone-Based Language Adaptation for
                 Low-Resource Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1829--1844",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Neural text-to-speech (TTS) systems have made
                 significant progress in generating natural synthetic
                 speech. However, neural TTS requires large amounts of
                 paired training data, which limits its applicability to
                 a small number of resource-rich languages. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Yingming Gao and Peter Birkholz and Ya Li",
  title =        "Articulatory Copy Synthesis Based on the Speech
                 Synthesizer {VocalTractLab} and Convolutional Recurrent
                 Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1845--1858",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Articulatory copy synthesis (ACS) refers to the
                 synthetic reproduction of natural utterances. The
                 existing methods of ACS have the limitations of poor
                 generalizability for unknown speakers, high computing
                 costs, the lack of systematic evaluation, etc.
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Th{\'e}o Mariotte and Anthony Larcher and Silvio
                 Montr{\'e}sor and Jean-Hugh Thomas",
  title =        "Channel-Combination Algorithms for Robust Distant
                 Voice Activity and Overlapped Speech Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1859--1872",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Voice Activity Detection (VAD) and Overlapped Speech
                 Detection (OSD) are key pre-processing tasks for
                 speaker diarization. In the meeting context, it is
                 often easier to capture speech with a distant device.
                 This consideration however leads to severe \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  ";

  author =       "Luciana M. X. de Souza and M{\'a}rcio H. Costa and
                 Renata Coelho Borges",
  title =        "Envelope-Based Multichannel Noise Reduction for
                 Cochlear Implant Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1873--1884",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Cochlear implants (CI) are implantable electronic
                 prostheses that aim to restore communication in people
                 with severe to profound hearing loss. This is achieved
                 by transforming the acoustic signals into electrical
                 stimuli and applying them directly to the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Linjian Li and Yi Cai and Xin Wu",
  title =        "Unsupervised Disentanglement Learning Model for
                 Exemplar-Guided Paraphrase Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1885--1900",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Exemplar-guided paraphrase generation is the task of
                 generating a paraphrase for a source sentence when
                 given another exemplar sentence as syntactic guidance
                 information. The target sentence must convey the
                 semantics of the source sentence in surface form, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Amir Ivry and Israel Cohen and Baruch Berdugo",
  title =        "A User-Centric Approach for Deep Residual-Echo
                 Suppression in Double-Talk",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1901--1914",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "We introduce a user-centric residual-echo suppression
                 (URES) framework in double-talk. This framework
                 receives a user operating point (UOP) that consists of
                 two metric values: the residual echo suppression level
                 (RESL) and the desired speech-maintained \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Geng Zhang and Jin Liu and Guangyou Zhou and Kunsong
                 Zhao and Zhiwen Xie and Bo Huang",
  title =        "Question-Directed Reasoning With Relation-Aware Graph
                 Attention Network for Complex Question Answering Over
                 Knowledge Graph",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1915--1927",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Complex knowledge graph question answering (KGQA) aims
                 at answering natural language questions by entities
                 retrieving from a knowledge graph (KG). Recently, the
                 relation path-based models have shown the unique
                 advantage for complex KGQA. However, these \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Yu Yao and Peng Yang and Guangzhen Zhao and Guoshun
                 ??",
  title =        "{KGAgent}: Learning a Deep Reinforced Agent for
                 Keyphrase Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1928--1940",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Keyphrase generation (KG) is an essential problem in
                 many natural language processing (NLP) tasks. Deep
                 learning keyphrase generation methods often combine the
                 copy and generating action-aware probabilities to model
                 keyphrase accuracy, ignoring the copy \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Jiahong Li and Chenda Li and Yifei Wu and Yanmin
                 Qian",
  title =        "Unified Cross-Modal Attention: Robust Audio-Visual
                 Speech Recognition and Beyond",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1941--1953",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Audio-Visual Speech Recognition (AVSR) is a promising
                 approach to improving the accuracy and robustness of
                 speech recognition systems with the assistance of
                 visual cues in challenging acoustic environments. In
                 this paper, we present a novel audio-visual \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Mieszko Fra{\'s} and Konrad Kowalczyk",
  title =        "Reverberant Source Separation Using {NTF} With Delayed
                 Subsources and Spatial Priors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1954--1967",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Speech signals recorded by distant microphones are
                 often contaminated with room reverberation and signals
                 of interfering speakers. This article addresses the
                 problem of joint source separation and dereverberation
                 using multichannel nonnegative tensor \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

  author =       "Rui Wang and Li Li and Tomoki Toda",
  title =        "Dual-Channel Target Speaker Extraction Based on
                 Conditional Variational Autoencoder and Directional
                 Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1968--1979",
  year =         "2024",
  DOI =          "",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "",
  URL =          "",
  abstract =     "Target speaker extraction (TSE) has become an
                 attractive research topic in recent years. However, TSE
                 under the underdetermined conditions is still a
                 challenge. In this paper, we deal with a dual-channel
                 TSE problem under underdetermined conditions. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "",

%%% [27-May-2021] TO DO: ACM has only 30 articles in volume 28, but IEEE shows 180!
%%% [07-Apr-2022] v30 is incomplete (full year coverage)
%%% [17-May-2023] Check contents for most recent volume: additions are made during the year; also fix bibsource data