%%% -*-BibTeX-*- %%% ==================================================================== %%% BibTeX-file{ %%% author = "Nelson H. F. Beebe", %%% version = "1.17", %%% date = "12 April 2024", %%% time = "09:42:59 MST", %%% filename = "ieeeacmtaslp.bib", %%% address = "University of Utah %%% Department of Mathematics, 110 LCB %%% 155 S 1400 E RM 233a %%% Salt Lake City, UT 84112-0090 %%% USA", %%% telephone = "+1 801 581 5254", %%% FAX = "+1 801 581 4148", %%% URL = "https://www.math.utah.edu/~beebe", %%% checksum = "50257 65862 250970 2818881", %%% email = "beebe at math.utah.edu, beebe at acm.org, %%% beebe at computer.org (Internet)", %%% codetable = "ISO/ASCII", %%% keywords = "bibliography; BibTeX; IEEE/ACM Transactions %%% on Audio, Speech, and Language Processing", %%% license = "public domain", %%% supported = "yes", %%% docstring = "This is a COMPLETE bibliography of the %%% journal IEEE/ACM Transactions on Audio, %%% Speech, and Language Processing (CODEN none, %%% ISSN 2329-9290). The journal began publishing %%% in 2014 as the merger of the journals ACM %%% Transactions on Speech and Language %%% Processing (TSLP) (2004--2013) and IEEE %%% Transactions on Audio, Speech, and Language %%% Processing (2006--2013). The initial volume %%% of the merged journal is 22, continuing the %%% numbering of the IEEE parent journal. %%% %%% The journal has Web sites at %%% %%% https://dl.acm.org/loi/taslp %%% http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655 %%% %%% At version 1.17, the COMPLETE journal %%% coverage looked like this: %%% %%% 2014 ( 298) 2018 ( 276) 2022 ( 121) %%% 2015 ( 292) 2019 ( 209) 2023 ( 311) %%% 2016 ( 265) 2020 ( 60) 2024 ( 155) %%% 2017 ( 275) 2021 ( 292) %%% %%% Article: 2554 %%% %%% Total entries: 2554 %%% %%% The checksum field above contains a CRC-16 %%% checksum as the first value, followed by the %%% equivalent of the standard UNIX wc (word %%% count) utility output of lines, words, and %%% characters. 
This is produced by Robert %%% Solovay's checksum utility.", %%% } %%% ==================================================================== @Preamble{ "\input bibnames.sty" # "\ifx \undefined \dbar \def \dbar {\leavevmode\raise0.2ex\hbox{--}\kern-0.5emd} \fi" # "\ifx \undefined \Dbar \def \Dbar {\leavevmode\raise0.2ex\hbox{--}\kern-0.5emD} \fi" # "\ifx \undefined \ocirc \def \ocirc #1{{\accent'27#1}}\fi" # "\ifx \undefined \r \def \r #1{\ocirc{#1}} \fi" } %%% ==================================================================== %%% Acknowledgement abbreviations: @String{ack-nhfb = "Nelson H. F. Beebe, University of Utah, Department of Mathematics, 110 LCB, 155 S 1400 E RM 233, Salt Lake City, UT 84112-0090, USA, Tel: +1 801 581 5254, FAX: +1 801 581 4148, e-mail: \path|beebe@math.utah.edu|, \path|beebe@acm.org|, \path|beebe@computer.org| (Internet), URL: \path|https://www.math.utah.edu/~beebe/|"} %%% ==================================================================== %%% Journal abbreviations: @String{j-IEEE-ACM-TASLP = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing"} %%% ==================================================================== %%% Bibliography entries, sorted in publication order: @Article{Anonymous:2014:TCa, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "1--2", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2295965", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCb, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = 
"1", pages = "3--4", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2295968", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Deng:2014:EET, author = "L. Deng and S. Renals and M. Federico and M. Ostendorf", title = "Editorial: Expanding the Technical Reach of our Transactions", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "5--5", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2290172", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Taghia:2014:OIM, author = "J. Taghia and R. Martin", title = "Objective Intelligibility Measures Based on Mutual Information for Speech Subjected to Speech Enhancement Processing", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "6--16", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASL.2013.2281574", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lu:2014:CLS, author = "Liang Lu and A. 
Ghoshal and S. Renals", title = "Cross-Lingual Subspace {Gaussian} Mixture Models for Low-Resource Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "17--27", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASL.2013.2281575", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gasic:2014:GPP, author = "M. Gasic and S. Young", title = "{Gaussian} Processes for {POMDP}-Based Dialogue Manager Optimization", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "28--40", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASL.2013.2282190", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mezghani-Marrakchi:2014:NAS, author = "I. Mezghani-Marrakchi and G. Mahe and S. Djaziri-Larbi and M. Jaidane and M. 
Turki-Hadj Alouane", title = "Nonlinear Audio Systems Identification Through Audio Input {Gaussianization}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "41--53", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASL.2013.2282214", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Crespo:2014:MSR, author = "J. B. Crespo and R. C. Hendriks", title = "Multizone Speech Reinforcement", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "54--66", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASL.2013.2283100", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pan:2014:PSM, author = "Chao Pan and Jingdong Chen and J. 
Benesty", title = "Performance Study of the {MVDR} Beamformer as a Function of the Source Incidence Angle", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "67--79", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASL.2013.2283104", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lee:2014:ISR, author = "Hung-yi Lee and Lin-shan Lee", title = "Improved Semantic Retrieval of Spoken Content by Document\slash Query Expansion with Random Walk Over Acoustic Similarity Graphs", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "80--94", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2285469", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Leutnant:2014:NOM, author = "V. Leutnant and A. Krueger and R. 
Haeb-Umbach", title = "A New Observation Model in the Logarithmic Mel Power Spectral Domain for the Automatic Recognition of Noisy Reverberant Speech", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "95--109", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2285480", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2014:CPT, author = "N. F. Chen and S. W. Tam and Wade Shen and J. P. Campbell", title = "Characterizing Phonetic Transformations and Acoustic Differences Across {English} Dialects", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "110--124", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2285482", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Markovic:2014:EAR, author = "D. Markovic and K. Kowalczyk and F. Antonacci and C. Hofmann and A. Sarti and W. 
Kellermann", title = "Estimation of Acoustic Reflection Coefficients Through Pseudospectrum Matching", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "125--137", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2285483", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Duan:2014:MPS, author = "Zhiyao Duan and Jinyu Han and B. Pardo", title = "Multi-pitch Streaming of Harmonic Sound Mixtures", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "138--150", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2285484", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2014:TVW, author = "Shilin Liu and Khe Chai Sim", title = "Temporally Varying Weight Regression: A Semi-Parametric Trajectory Model for Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "151--160", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2285487", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tomar:2014:FDM, author = "V. S. Tomar and R. C. Rose", title = "A Family of Discriminative Manifold Learning Algorithms and Their Application to Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "161--171", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2286906", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Doi:2014:ASE, author = "H. Doi and T. Toda and K. Nakamura and H. Saruwatari and K. Shikano", title = "Alaryngeal Speech Enhancement Based on One-to-Many Eigenvoice Conversion", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "172--183", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2286917", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Arisoy:2014:CNN, author = "E. Arisoy and S. F. Chen and B. Ramabhadran and A. 
Sethy", title = "Converting Neural Network Language Models into Back-off Language Models for Efficient Decoding in Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "184--192", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2286919", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jin:2014:DOE, author = "C. T. Jin and N. Epain and A. Parthy", title = "Design, Optimization and Evaluation of a Dual-Radius Spherical Microphone Array", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "193--204", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2286920", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mignot:2014:LFI, author = "R. Mignot and G. Chardon and L. 
Daudet", title = "Low Frequency Interpolation of Room Impulse Responses Using Compressed Sensing", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "205--216", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2286922", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Senoussaoui:2014:SCD, author = "M. Senoussaoui and P. Kenny and T. Stafylakis and P. Dumouchel", title = "A Study of the Cosine Distance-Based Mean Shift for Telephone Speech Diarization", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "217--227", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2285474", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tachibana:2014:SVE, author = "H. Tachibana and N. Ono and S. 
Sagayama", title = "Singing Voice Enhancement in Monaural Music Signals Based on Two-stage Harmonic\slash Percussive Sound Separation on Multiple Resolution Spectrograms", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "228--237", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2287052", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shabtai:2014:GSA, author = "N. R. Shabtai and B. Rafaely", title = "Generalized Spherical Array Beamforming for Binaural Speech Reproduction", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "238--247", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2290499", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cumani:2014:FSS, author = "S. Cumani and P. 
Laface", title = "Factorized Sub-Space Estimation for Fast and Memory Effective {$I$}-vector Extraction", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "248--259", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2290505", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zeng:2014:DDS, author = "Yuan Zeng and R. C. Hendriks", title = "Distributed Delay and Sum Beamformer for Speech Enhancement via Randomized Gossip", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "260--273", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2290861", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2014:JOC, author = "Zhenghua Li and Min Zhang and Wanxiang Che and Ting Liu and Wenliang Chen", title = "Joint Optimization for {Chinese} {POS} Tagging and Dependency Parsing", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "274--286", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2288081", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", 
journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATa, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing --- EDICS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "289--290", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300354", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATb, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "291--292", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300353", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:OAa, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "293--293", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300352", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, 
Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPa, author = "Anonymous", title = "[{Blank} page]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "B287--B288", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300362", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:FCa, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "C1", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2298102", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATc, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "C2", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300774", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL 
= "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:ISPa, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "C3", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2301051", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPBa, author = "Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "1", pages = "C4", month = jan, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300363", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCc, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "289--290", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300331", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCd, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "291--292", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300411", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gao:2014:SSF, author = "Dehong Gao and Wenjie Li and Xiaoyan Cai and Renxian Zhang and You Ouyang", title = "Sequential Summarization: a Full View of {Twitter} Trending Topics", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "293--302", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASL.2013.2282191", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{vanHengel:2014:CST, author = "P. W. J. van Hengel and J. D. 
Krijnders", title = "A Comparison of Spectro-Temporal Representations of Audio Signals", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "303--313", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASL.2013.2283105", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zitouni:2014:APC, author = "I. Zitouni and Y. Benajiba", title = "Aligned-Parallel-Corpora Based Semi-Supervised Learning for {Arabic} Mention Detection", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "314--324", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2287055", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Molina:2014:DRP, author = "E. Molina and A. M. Barbancho and L. J. Tardon and I. 
Barbancho", title = "Dissonance Reduction In Polyphonic Audio Using Harmonic Reorganization", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "325--334", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2287056", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lun:2014:NEM, author = "D. P. K. Lun and Tak-Wai Shen and K. C. Ho", title = "A Novel Expectation-Maximization Framework for Speech Enhancement in Non-Stationary Noise Environments", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "335--346", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2290497", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cosentino:2014:CIF, author = "S. Cosentino and T. H. Falk and D. McAlpine and T. 
Marquardt", title = "Cochlear Implant Filterbank Design and Optimization: A Simulation Study", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "347--353", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2290502", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Souden:2014:LFI, author = "M. Souden and K. Kinoshita and M. Delcroix and T. Nakatani", title = "Location Feature Integration for Clustering-Based Speech Separation in Distributed Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "354--367", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2292308", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kallasjoki:2014:EUI, author = "H. Kallasjoki and J. F. Gemmeke and K. J. 
Palom{\"a}ki",
  title =        "Estimating Uncertainty to Improve Exemplar-Based Feature Enhancement for Noise Robust Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "368--380",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2013.2292328",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Hasan:2014:MLA,
  author =       "T. Hasan and J. H. L. Hansen",
  title =        "Maximum Likelihood Acoustic Factor Analysis Models for Robust Speaker Verification in Noise",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "381--391",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2013.2292356",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Schwartz:2014:STU,
  author =       "O. Schwartz and S.
Gannot", title = "Speaker Tracking Using Recursive {EM} Algorithms", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "392--402", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2292361", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tsao:2014:MBO, author = "Yu Tsao and S. Matsuda and C. Hori and H. Kashioka and Chin-Hui Lee", title = "A {MAP}-based Online Estimation Approach to Ensemble Speaker and Speaking Environment Modeling", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "403--416", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2292362", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hui:2014:LSA, author = "Pui-Yu Hui and H. 
Meng", title = "Latent Semantic Analysis for Multimodal User Input With Speech and Gestures", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "417--429", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2294586", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jensen:2014:SIP, author = "J. Jensen and C. H. Taal", title = "Speech Intelligibility Prediction Based on Mutual Information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "430--440", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2295914", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Primavera:2014:OSI, author = "A. Primavera and S. Cecchi and Junfeng Li and F. 
Piazza",
  title =        "Objective and Subjective Investigation on a Novel Method for Digital Reverberator Parameters Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "441--452",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2013.2295925",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Speed:2014:MVT,
  author =       "M. Speed and D. Murphy and D. Howard",
  title =        "Modeling the Vocal Tract Transfer Function Using a {$3$D} Digital Waveguide Mesh",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "453--464",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2013.2294579",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Hacihabiboglu:2014:TAO,
  author =       "H{\"u}seyin Hac{\i}habibo{\u{g}}lu",
  title =        "Theoretical Analysis of Open Spherical Microphone Arrays for Acoustic Intensity Measurements",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "2",
  pages =        "465--476",
  month =        feb,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2013.2294581",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:30 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cho:2014:RII, author = "Taemin Cho and J. P. Bello", title = "On the Relative Importance of Individual Components of Chord Recognition Systems", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "477--492", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2295926", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Otsuka:2014:BNM, author = "T. Otsuka and K. Ishiguro and H. Sawada and H. G. Okuno", title = "{Bayesian} Nonparametrics for Microphone Array Processing", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "493--504", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2294582", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{He:2014:LEB, author = "Jianjun He and Ee-Leng Tan and Woon-Seng Gan", title = "Linear Estimation Based Primary-Ambient Extraction for Stereo Audio Signals", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "505--517", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2297015", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gonzalez:2014:PPE, author = "S. Gonzalez and M. Brookes", title = "{PEFAC} --- A Pitch Estimation Algorithm Robust to High Levels of Noise", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "518--530", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2295918", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2014:BCC, author = "Min Zhang and Xiangyu Duan and Wenliang Chen", title = "{Bayesian} Constituent Context Model for Grammar Induction", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "531--541", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2294584", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chang:2014:FAN, author = "Dah-Chung Chang and Fei-Tao Chu", title = "Feedforward Active Noise Control With a New Variable Tap-Length and Step-Size Filtered-{X} {LMS} Algorithm", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "542--555", month = feb, year = "2014", CODEN = "????", DOI 
= "https://doi.org/10.1109/TASLP.2013.2297016", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{McVicar:2014:ACE, author = "M. McVicar and R. Santos-Rodriguez and Yizhao Ni and Tijl {De Bie}", title = "Automatic Chord Estimation from Audio: a Review of the State of the Art", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "556--575", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2294580", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATd, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} --- {EDICS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "576--577", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300358", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATe, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} 
Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "578--579", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300357", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:OAb, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "580--580", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300351", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:FCb, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "C1", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300374", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATf, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = 
j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "C2", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300775", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:ISPb, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "C3", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2301052", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPBb, author = "Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "2", pages = "C4", month = feb, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300361", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:30 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCe, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "581--582", month = mar, 
year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2307456", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCf, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "583--584", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2307457", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2014:SSS, author = "Chung-Hsien Wu and Yi-Chin Huang and Chung-Han Lee and Jun-Cheng Guo", title = "Synthesis of Spontaneous Speech With Syllable Contraction Using State-Based Context-Dependent Voice Transformation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "585--595", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2297018", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Airaksinen:2014:QCP, author = "M. Airaksinen and T. Raitio and B. Story and P. 
Alku", title = "Quasi Closed Phase Glottal Inverse Filtering Analysis With Weighted Linear Prediction", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "596--607", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2294585", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2014:OSD, author = "Jae-Mo Yang and Hong-Goo Kang", title = "Online Speech Dereverberation Algorithm Based on Adaptive Multichannel Linear Prediction", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "608--619", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2294578", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Asaei:2014:SSM, author = "A. Asaei and M. Golbabaee and H. Bourlard and V. 
Cevher", title = "Structured Sparsity Models for Reverberant Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "620--633", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2297012", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rashobh:2014:MEK, author = "R. S. Rashobh and A. W. H. Khong and Di Liu", title = "Multichannel Equalization in the {KLT} and Frequency Domains With Application to Speech Dereverberation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "634--646", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2013.2297013", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Samarasinghe:2014:WAL, author = "P. Samarasinghe and T. Abhayapala and M. 
Poletti", title = "Wavefield Analysis Over Large Areas Using Distributed Higher Order Microphones", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "647--658", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300341", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wei:2014:EPF, author = "Wen-Li Wei and Chung-Hsien Wu and Jen-Chun Lin and Han Li", title = "Exploiting Psychological Factors for Interaction Style Recognition in Spoken Conversation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "659--671", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2300339", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Raczynski:2014:GBM, author = "S. A. Raczy{\'n}ski and E. 
Vincent",
  title =        "Genre-Based Music Language Modeling with Latent Hierarchical {Pitman-Yor} Process Allocation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "672--681",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2014.2300344",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wu:2014:TCS,
  author =       "Dalei Wu and Wei-Ping Zhu and M. N. S. Swamy",
  title =        "The Theory of Compressive Sensing Matching Pursuit Considering Time-domain Noise with Application to Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "3",
  pages =        "682--696",
  month =        mar,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2014.2300336",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:36 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Nanjundaswamy:2014:CLT,
  author =       "T. Nanjundaswamy and K.
Rose", title = "Cascaded Long Term Prediction for Enhanced Compression of Polyphonic Audio Signals", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "697--710", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2303292", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Audhkhasi:2014:TAD, author = "K. Audhkhasi and A. M. Zavou and P. G. Georgiou and S. S. Narayanan", title = "Theoretical Analysis of Diversity in an Ensemble of Automatic Speech Recognition Systems", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "711--726", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2303295", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nikunen:2014:DAB, author = "J. Nikunen and T. 
Virtanen", title = "Direction of Arrival Based Spatial Covariance Model for Blind Sound Source Separation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "727--739", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2303576", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATg, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "741--742", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311613", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATh, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "743--744", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311612", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:OAc, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "745--745", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2312837", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:PYAa, author = "Anonymous", title = "Publish your article in {IEEE Access}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "746--746", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2312836", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPc, author = "Anonymous", title = "[{Blank} page]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "B740", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311572", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:FCc, 
author = "Anonymous", title = "[{Front} cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "C1", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311576", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATi, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "C2", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311615", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:ISPc, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "C3", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311614", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPBc, author = 
"Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "3", pages = "C4", month = mar, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311573", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:36 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCg, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "741--742", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2312758", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCh, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "743--744", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2312798", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2014:ONR, author = "Jinyu Li and Li Deng and Yifan Gong and R. 
Haeb-Umbach", title = "An Overview of Noise-Robust Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "745--777", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2304637", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sarikaya:2014:ADB, author = "R. Sarikaya and G. E. Hinton and A. Deoras", title = "Application of Deep Belief Networks for Natural Language Understanding", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "778--784", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2303296", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Serizel:2014:LRA, author = "R. Serizel and M. Moonen and B. {Van Dijk} and J. 
Wouters", title = "Low-rank Approximation Based Multichannel {Wiener} Filter Algorithms for Noise Reduction with Application in Cochlear Implants", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "785--799", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2304240", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Crocco:2014:DSP, author = "M. Crocco and A. Trucco", title = "Design of Superdirective Planar Arrays With Sparse Aperiodic Layouts for Processing Broadband Signals via {$3$-D} Beamforming", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "800--815", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2304635", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zapata:2014:MFB, author = "J. R. Zapata and M. E. P. Davies and E. 
G{\'o}mez", title = "Multi-Feature Beat Tracking", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "816--825", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2305252", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Narayanan:2014:ISS, author = "A. Narayanan and Deliang Wang", title = "Investigation of Speech Separation as a Front-End for Noise Robust Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "826--835", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2305833", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2014:RSI, author = "Xiaojia Zhao and Yuxuan Wang and Deliang Wang", title = "Robust Speaker Identification in Noisy and Reverberant Conditions", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "836--845", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2308398", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp;
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cumani:2014:UVP, author = "S. Cumani and O. Plchot and P. Laface", title = "On the use of {$i$}-vector posterior distributions in Probabilistic Linear Discriminant Analysis", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "846--857", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2308473", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2014:CEP, author = "Chung-Hsien Wu and Han-Ping Shen and Yan-Ting Yang", title = "{Chinese--English} Phone Set Construction for Code-Switching {ASR} Using Acoustic and {DNN}-Extracted Articulatory Features", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "858--862", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2310353", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATj, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "863--864", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311617", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource =
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATk, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "865--866", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311616", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:OAd, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "867--867", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2312839", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:PYAb, author = "Anonymous", title = "Publish your article in {IEEE Access}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "868--868", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2312838", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:FCd, author = "Anonymous", title = "[{Front} cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "C1", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311593", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATl, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "C2", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311619", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:ISPd, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "C3", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311618", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPBd, author = "Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "4", pages = "C4", month = apr, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311575", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCi, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "869--870", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2320471", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCj, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "871--872", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2321252", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = 
"IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2014:DTS, author = "Weibin Zhang and P. Fung", title = "Discriminatively Trained Sparse Inverse Covariance Matrices for Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "873--882", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2312548", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lee:2014:SKO, author = "Hung-yi Lee and Sz-Rung Shiang and Ching-Feng Yeh and Yun-Nung Chen and Yu Huang and Sheng-Yi Kong and Lin-shan Lee", title = "Spoken Knowledge Organization by Semantic Structuring and a Prototype Course Lecture System for Personalized Learning", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "883--898", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2310993", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zao:2014:SEE, author = "L. Z{\~a}o and R. Coelho and P. 
Flandrin", title = "Speech Enhancement with {EMD} and {Hurst}-Based Mode Selection", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "899--911", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2312541", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Giacobello:2014:SNE, author = "D. Giacobello and M. G. Christensen and T. L. Jensen and M. N. Murthi and S. H. Jensen and M. Moonen", title = "Stable {$1$}-Norm Error Minimization Based Linear Predictors for Speech Modeling", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "912--922", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311324", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lacouture-Parodi:2014:MNR, author = "Y. Lacouture-Parodi and E. A. P. Habets and Jingdong Chen and J.
Benesty", title = "Multichannel Noise Reduction in the {Karhunen--Lo{\`e}ve} Expansion Domain", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "923--936", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311299", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sadjadi:2014:BSW, author = "S. O. Sadjadi and J. H. L. Hansen", title = "Blind Spectral Weighting for Robust Speaker Identification under Reverberation Mismatch", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "937--945", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311329", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mantena:2014:QES, author = "G. Mantena and S. Achanta and K. 
Prahallad", title = "Query-by-Example Spoken Term Detection using Frequency Domain Linear Prediction and Non-Segmental Dynamic Time Warping", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "946--955", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311322", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Osterwise:2014:DFD, author = "C. Osterwise and S. L. Grant", title = "On Over-Determined Frequency Domain {BSS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "956--966", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2307166", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jarrett:2014:NRS, author = "D. P. Jarrett and M. Taseska and E. A. P. Habets and P. A. 
Naylor", title = "Noise Reduction in the Spherical Harmonic Domain Using a Tradeoff Beamformer and Narrowband {DOA} Estimates", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "967--978", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311925", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rieser:2014:NLG, author = "V. Rieser and O. Lemon and S. Keizer", title = "Natural Language Generation as Incremental Planning Under Uncertainty: Adaptive Information Presentation for Statistical Dialogue Systems", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "979--994", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASL.2014.2315271", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cheer:2014:CCP, author = "J. Cheer and S. J. 
Elliott", title = "Comments on {``Complete Parallel Narrowband Active Noise Control Systems''}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "995--996", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2311319", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATm, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "999--1000", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2325659", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATn, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "1001--1002", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2325660", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPd, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "B997--B998", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2325663", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:FCe, author = "Anonymous", title = "[{Front} cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "C1", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2321652", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATo, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "C2", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2325657", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:ISPe, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "C3", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2325658", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPBe, author = "Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "5", pages = "C4", month = may, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2325664", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:37 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCk, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "999--1000", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2324091", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
@Article{Anonymous:2014:TCl, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "1001--1002", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2324211", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Arora:2014:MSC, author = "V. Arora and L. Behera", title = "Musical Source Clustering and Identification in Polyphonic Audio", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "1003--1012", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2313404", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nongpiur:2014:DMB, author = "R. C. 
Nongpiur", title = "Design of Minimax Broadband Beamformers that are Robust to Microphone Gain, Phase, and Position Errors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "1013--1022", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2315044", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Venkitaraman:2014:BSP, author = "A. Venkitaraman and C. S. Seelamantula", title = "Binaural Signal Processing Motivated Generalized Analytic Signal Construction and {AM--FM} Demodulation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "1023--1036", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2316376", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Geiger:2014:MEN, author = "J. T. Geiger and F. Weninger and J. F. Gemmeke and M. W{\"o}llmer and B. Schuller and G. 
Rigoll", title = "Memory-Enhanced Neural Networks and {NMF} for Robust {ASR}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "1037--1046", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2318514", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2014:MPA, author = "Haiquan Zhao and Yi Yu and Shibin Gao and Xiangping Zeng and Zhengyou He", title = "Memory Proportionate {APA} with Individual Activation Factors for Acoustic Echo Cancellation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "1047--1055", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2318519", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gangeh:2014:MSD, author = "M. J. Gangeh and P. Fewzee and A. Ghodsi and M. S. Kamel and F. 
Karray", title = "Multiview Supervised Dictionary Learning in Speech Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "1056--1068", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2319157", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Choi:2014:DMV, author = "Jae-Hun Choi and Joon-Hyuk Chang", title = "Dual-Microphone Voice Activity Detection Technique Based on Two-Step Power Level Difference Ratio", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "1069--1081", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2313917", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Alameda-Pineda:2014:GAS, author = "X. Alameda-Pineda and R. 
Horaud", title = "A Geometric Approach to Sound Source Localization from Time-Delay Estimates", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "1082--1095", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2317989", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Reindl:2014:MMI, author = "K. Reindl and S. Meier and H. Barfuss and W. Kellermann", title = "Minimum Mutual Information-Based Linearly Constrained Broadband Signal Extraction", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "1096--1108", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2319155", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATp, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "1109--1110", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2325655", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATq, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "1111--1112", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2325656", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:FCf, author = "Anonymous", title = "[{Front} cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "C1", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2321651", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATr, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "C2", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2325653", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, 
and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:ISPf, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "C3", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2325654", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPBf, author = "Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "6", pages = "C4", month = jun, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2325665", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCm, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1113--1114", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2331931", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCn, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1115--1116", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2332931", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bahari:2014:NNF, author = "M. H. Bahari and N. Dehak and H. {Van hamme} and L. Burget and A. M. Ali and J. Glass", title = "Non-Negative Factor Analysis of {Gaussian} Mixture Model Weight Adaptation for Language and Dialect Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1117--1129", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2319159", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bao:2014:LDD, author = "Guangzhao Bao and Yangfei Xu and Zhongfu Ye", title = "Learning a Discriminative Dictionary for Single-Channel Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1130--1138", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2320575", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", 
acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kelly:2014:DAR, author = "I. J. Kelly and F. M. Boland", title = "Detecting Arrivals in Room Impulse Responses With Dynamic Time Warping", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1139--1147", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2321472", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Guldenschuh:2014:DSP, author = "M. Guldenschuh and R. de Callafon", title = "Detection of Secondary-Path Irregularities in Active Noise Control Headphones", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1148--1157", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2321475", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2014:MSR, author = "Sin-Horng Chen and Chiao-Hua Hsieh and Chen-Yu Chiang and Hsi-Chun Hsiao and Yih-Ru Wang and Yuan-Fu Liao and Hsiu-Min Yu", title = "Modeling of Speaking Rate Influences on {Mandarin} Speech Prosody and Its Application to Speaking Rate-controlled {TTS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = 
"1158--1171", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2321482", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Comminiello:2014:NAE, author = "D. Comminiello and M. Scarpiniti and L. A. Azpicueta-Ruiz and J. Arenas-Garcia and A. Uncini", title = "Nonlinear Acoustic Echo Cancellation Based on Sparse Functional Link Representations", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1172--1183", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2324175", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2014:TDS, author = "Wen Zhang and T. D. 
Abhayapala", title = "Three Dimensional Sound Field Reproduction using Multiple Circular Loudspeaker Arrays: Functional Analysis Guided Approach", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1184--1194", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2324182", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Taseska:2014:ISF, author = "M. Taseska and E. A. P. Habets", title = "Informed Spatial Filtering for Sound Extraction Using Distributed Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1195--1207", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2327294", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shen:2014:DPR, author = "Mo Shen and D. Kawahara and S. 
Kurohashi", title = "Dependency Parse Reranking with Rich Subtree Features", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1208--1218", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2327295", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATs, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1221--1222", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340717", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATt, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1223--1224", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340718", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:OAe, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "1225--1225", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340720", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPe, author = "Anonymous", title = "[{Blank} page]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "B1219--B1220", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340723", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:FCg, author = "Anonymous", title = "[{Front} cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "C1", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2334814", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATu, author = 
"Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "C2", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340711", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:ISPg, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "C3", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340712", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPBg, author = "Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "7", pages = "C4", month = jul, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340722", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:38 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCo, author = 
"Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1221--1222", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2339751", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCp, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1223--1224", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2339771", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2014:IBD, author = "Zhibao Li and K. F. C. Yiu and S. Nordholm", title = "On the Indoor Beamformer Design With Reverberation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1225--1235", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2327299", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hawes:2014:SAD, author = "M. B. 
Hawes and Wei Liu", title = "Sparse Array Design for Wideband Beamforming With Reduced Complexity in Tapped Delay-Lines", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1236--1247", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2327298", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{FanChiang:2014:LCF, author = "Yi FanChiang and Cheng-Wen Wei and Yi-Le Meng and Yu-Wen Lin and Shyh-Jye Jou and Tian-Sheuan Chang", title = "Low Complexity Formant Estimation Adaptive Feedback Cancellation for Hearing Aids Using Pitch Based Processing", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1248--1259", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2327300", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", note = "See correction \cite{FanChiang:2014:CLC}.", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Conan:2014:SMI, author = "S. Conan and O. Derrien and M. Aramaki and S. Ystad and R. 
Kronland-Martinet", title = "A Synthesis Model With Intuitive Control Capabilities for Rolling Sounds", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1260--1273", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2327297", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schuldt:2014:DRE, author = "C. Sch{\"u}ldt and P. H{\"a}ndel", title = "Decay Rate Estimators and Their Performance for Blind Reverberation Time Estimation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1274--1284", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2328174", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ganapathy:2014:RFE, author = "S. Ganapathy and S. H. Mallidi and H. 
Hermansky", title = "Robust Feature Extraction Using Modulation Filtering of Autoregressive Models", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1285--1295", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2329190", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2014:SMA, author = "Bo Li and Khe Chai Sim", title = "A Spectral Masking Approach to Noise-Robust Speech Recognition Using Deep Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1296--1305", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2329237", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yilmaz:2014:NRE, author = "E. Yilmaz and J. F. Gemmeke and H. 
{Van hamme}", title = "Noise Robust Exemplar Matching Using Sparse Representations of Speech", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1306--1319", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2329188", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schmid:2014:VBI, author = "D. Schmid and G. Enzner and S. Malik and D. Kolossa and R. Martin", title = "Variational {Bayesian} Inference for Multichannel Dereverberation and Noise Reduction", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1320--1335", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2329732", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATv, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1336--1337", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340715", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATw, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1338--1339", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340716", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:OAf, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "1340--1340", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340719", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:FCh, author = "Anonymous", title = "[{Front} cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "C1", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340724", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATx, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "C2", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340713", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:ISPh, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "C3", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340714", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPBh, author = "Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "8", pages = "C4", month = aug, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2340721", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCq, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1341--1342", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2351112", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCr, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1343--1344", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2351171", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Masiero:2014:FCD, author = "B. Masiero and M. 
Vorl{\"a}nder", title = "A Framework for the Calculation of Dynamic Crosstalk Cancellation Filters", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1345--1354", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2329184", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schasse:2014:ESS, author = "A. Schasse and R. Martin", title = "Estimation of Subband Speech Correlations for Noise Reduction via {MVDR} Processing", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1355--1365", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2329633", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Novotny:2014:AEA, author = "Michal Novotn{\'y} and Jan Rusz and Roman {\v{C}}mejla and Ev{\v{z}}en R{\r{u}}{\v{z}}i{\v{c}}ka", title = "Automatic Evaluation of Articulatory Disorders in {Parkinson}'s Disease", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1366--1378", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2329734", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and 
Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lim:2014:RMD, author = "F. Lim and Wancheng Zhang and E. A. P. Habets and P. A. Naylor", title = "Robust Multichannel Dereverberation using Relaxed Multichannel Least Squares", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1379--1390", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2329632", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ghalehjegh:2014:LRB, author = "S. H. Ghalehjegh and R. C. Rose", title = "Linear Regression Based Acoustic Adaptation for the Subspace {Gaussian} Mixture Model", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1391--1402", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2332043", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Botts:2014:SPP, author = "J. Botts and L. 
Savioja", title = "Spectral and Pseudospectral Properties of Finite Difference Models Used in Audio and Room Acoustics", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1403--1412", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2332045", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xiang:2014:PBA, author = "Yong Xiang and I. Natgunanathan and Song Guo and Wanlei Zhou and S. Nahavandi", title = "Patchwork-Based Audio Watermarking Method Robust to De-synchronization Attacks", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1413--1423", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2328175", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{McLoughlin:2014:SAV, author = "I. V. 
McLoughlin", title = "Super-Audible Voice Activity Detection", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1424--1433", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2335055", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Alinaghi:2014:JMV, author = "A. Alinaghi and P. J. Jackson and Qingju Liu and Wenwu Wang", title = "Joint Mixing Vector and Binaural Model Based Stereo Source Separation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1434--1448", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2320637", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATy, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1451--1452", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359309", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATz, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1453--1454", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359310", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:OAg, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1455--1455", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359303", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TWAa, author = "Anonymous", title = "Together, we are advancing technology", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "1456--1456", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359304", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPf, author = "Anonymous", title = "[{Blank} page]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "B1449--B1450", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359300", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:FCi, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "C1", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2355651", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATaa, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "C2", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359297", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:ISPi, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "C3", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359298", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPBi, author = "Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "9", pages = "C4", month = sep, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359308", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:39 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCs, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1451--1452", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2357971", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
@Article{Anonymous:2014:TCt, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1453--1454", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2357931", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2014:DRD, author = "Liheng Zhao and J. Benesty and Jingdong Chen", title = "Design of Robust Differential Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1455--1466", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2337844", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jain:2014:EBM, author = "P. Jain and R. B. 
Pachori", title = "Event-Based Method for Instantaneous Fundamental Frequency Estimation from Voiced Speech Based on Eigenvalue Decomposition of the {Hankel} Matrix", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1467--1482", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2335056", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Vaizman:2014:CBA, author = "Y. Vaizman and B. McFee and G. Lanckriet", title = "Codebook-Based Audio Feature Representation for Music Information Retrieval", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1483--1493", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2337842", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nadiri:2014:LMS, author = "O. Nadiri and B. 
Rafaely", title = "Localization of Multiple Speakers under High Reverberation using a Spherical Microphone Array and the Direct-Path Dominance Test", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1494--1505", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2337846", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2014:EBS, author = "Zhizheng Wu and T. Virtanen and Eng Siong Chng and Haizhou Li", title = "Exemplar-Based Sparse Representation With Residual Compensation for Voice Conversion", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1506--1521", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2333242", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Talagala:2014:EMC, author = "D. S. Talagala and Wen Zhang and T. D. 
Abhayapala", title = "Efficient Multi-Channel Adaptive Room Compensation for Spatial Soundfield Reproduction Using a Modal Decomposition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1522--1532", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2339195", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Abdel-Hamid:2014:CNN, author = "O. Abdel-Hamid and A.-R. Mohamed and Hui Jiang and Li Deng and G. Penn and Dong Yu", title = "Convolutional Neural Networks for Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1533--1545", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2339736", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Koyama:2014:WFR, author = "S. Koyama and K. Furuya and Y. Hiwasaki and Y. Haneda and Y. 
Suzuki", title = "Wave Field Reconstruction Filtering in Cylindrical Harmonic Domain for With-Height Recording and Reproduction", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1546--1557", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2339735", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2014:PSS, author = "Chia-Ping Chen and Yi-Chin Huang and Chung-Hsien Wu and Kuan-De Lee", title = "Polyglot Speech Synthesis Based on Cross-Lingual Frame Selection Using Auditory and Articulatory Features", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1558--1570", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2339738", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATab, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1571--1572", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2358353", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions 
on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATac, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1573--1574", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2358354", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:OAh, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1575--1575", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359301", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TWAb, author = "Anonymous", title = "Together, we are advancing technology", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "1576--1576", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359302", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on 
Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:FCj, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "C1", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2357711", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATad, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "C2", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359294", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:ISPj, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "C3", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359295", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and 
Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPBj, author = "Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "10", pages = "C4", month = oct, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359307", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCu, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1577--1578", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2363751", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCv, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1579--1580", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2363771", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2014:UAA, author = "Jian Xu and Zhi-Jie Yan and Qiang Huo", title = "An Unsupervised Adaptation Approach to Leveraging Feedback Loop Data by Using $i$-Vector for Data Clustering and Selection", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1581--1589", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2341911", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cumani:2014:LST, author = "S. Cumani and P. Laface", title = "Large-Scale Training of Pairwise Support Vector Machines for Speaker Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1590--1600", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2341914", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Du:2014:IVF, author = "Jun Du and Qiang Huo", title = "An Improved {VTS} Feature Compensation using Mixture Models of Distortion and {IVN} Training for Noisy Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1601--1611", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2341912", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Togami:2014:SOA, author = "M. Togami and Y. Kawaguchi", title = "Simultaneous Optimization of Acoustic Echo Reduction, Speech Dereverberation, and Noise Reduction against Mutual Interference", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1612--1623", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2341918", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lorente:2014:GIM, author = "J. Lorente and M. Ferrer and M. de Diego and A. Gonzalez", title = "{GPU} Implementation of Multichannel Adaptive Algorithms for Local Active Noise Control", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1624--1635", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2344852", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Helie:2014:SFO, author = "T. 
H{\'e}lie", title = "Simulation of Fractional-Order Low-Pass Filters", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1636--1647", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2323715", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Defraene:2014:EOB, author = "B. Defraene and T. van Waterschoot and M. Diehl and M. Moonen", title = "Embedded-Optimization-Based Loudspeaker Precompensation Using a {Hammerstein} Loudspeaker Model", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1648--1659", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2344862", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2014:RBC, author = "Guangsen Wang and Khe Chai Sim", title = "Regression-Based Context-Dependent Modeling of Deep Neural Networks for Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1660--1669", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2344855", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Badeau:2014:MHR, author = "R. Badeau and M. D. Plumbley", title = "Multichannel High-Resolution {NMF} for Modeling Convolutive Mixtures of Non-Stationary Signals in the Time-Frequency Domain", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1670--1680", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2341920", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATae, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1683--1684", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2373579", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATaf, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "1685--1686", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2373580", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPg, author = "Anonymous", title = "[{Blank} page]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "B1681--B1682", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2372931", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:FCk, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "C1", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2360425", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATag, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "C2", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2373573", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:ISPk, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "C3", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2373578", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPBk, author = "Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "11", pages = "C4", month = nov, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2373672", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:TCw, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1683--1685", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2372211", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", 
acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Deng:2014:FEK, author = "Li Deng", title = "Farewell editorial: Keeping up the momentum of innovations", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1687--1687", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2370434", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yella:2014:OSD, author = "S. H. Yella and H. Bourlard", title = "Overlapping Speech Detection Using Long-Term Conversational Features for Speaker Diarization in Meeting Room Conversations", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1688--1700", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2346315", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chivukula:2014:FAL, author = "R. K. Chivukula and Y. A. Reznik and Yanyan Hu and V. Devarajan and M.
Jayendra-Lakshman", title = "Fast Algorithms for Low-Delay {TDAC} Filterbanks in {MPEG-4} {AAC--ELD}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1701--1712", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2346314", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xue:2014:FAD, author = "Shaofei Xue and O. Abdel-Hamid and Hui Jiang and Lirong Dai and Qingfeng Liu", title = "Fast Adaptation of Deep Neural Network Based on Discriminant Codes for Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1713--1725", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2346313", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Davies:2014:AAC, author = "M. E. P. Davies and P. Hamel and K. Yoshii and M. 
Goto", title = "{AutoMashUpper}: Automatic Creation of Multi-Song Music Mashups", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1726--1737", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2347135", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Weng:2014:LSR, author = "Chao Weng and D. L. Thomson and P. Haffner and B.-H. F. Juang", title = "Latent Semantic Rational Kernels for Topic Spotting on Conversational Speech", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1738--1749", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2347133", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wachowski:2014:DCN, author = "N. Wachowski and M. R. 
Azimi-Sadjadi", title = "Detection and Classification of Nonstationary Transient Signals Using Sparse Approximations and {Bayesian} Networks", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1750--1764", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2348913", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Percival:2014:STE, author = "G. Percival and G. Tzanetakis", title = "Streamlined Tempo Estimation Based on Autocorrelation and Cross-correlation With Pulses", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1765--1776", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2348916", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Barkefors:2014:DAL, author = "A. Barkefors and M. Sternad and L.-J. 
Br{\"a}nnmark", title = "Design and Analysis of Linear Quadratic {Gaussian} Feedforward Controllers for Active Noise Control", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1777--1791", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2349856", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cobos:2014:CSB, author = "M. Cobos and J. J. P{\'e}rez-Solano and S. Felici-Castell and J. Segura and J. M. Navarro", title = "Cumulative-Sum-Based Localization of Sound Events in Low-Cost Wireless Acoustic Sensor Networks", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1792--1802", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2351132", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tourbabin:2014:TFO, author = "V. Tourbabin and B.
Rafaely", title = "Theoretical Framework for the Optimization of Microphone Array Configuration for Humanoid Robot Audition", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1803--1814", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2351133", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zakharov:2014:SWR, author = "Y. Zakharov and V. H. Nascimento", title = "Sliding-Window {RLS} Low-Cost Implementation of Proportionate Affine Projection Algorithms", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1815--1824", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2352456", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{DAngelo:2014:GMLa, author = "S. D'Angelo and V. 
V{\"a}lim{\"a}ki", title = "Generalized {Moog} Ladder Filter: {Part I} --- Linear Analysis and Parameterization", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1825--1832", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2352495", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2014:BNR, author = "Na Yang and He Ba and Weiyang Cai and I. Demirkol and W. Heinzelman", title = "{BaNa}: a Noise Resilient Fundamental Frequency Detection Algorithm for Speech and Music", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1833--1848", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2352453", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2014:TTS, author = "Yuxuan Wang and A.
Narayanan and Deliang Wang", title = "On Training Targets for Supervised Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1849--1858", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2352935", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2014:VCU, author = "Ling-Hui Chen and Zhen-Hua Ling and Li-Juan Liu and Li-Rong Dai", title = "Voice Conversion Using Deep Neural Networks With Layer-Wise Generative Training", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1859--1872", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2353991", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{DAngelo:2014:GMLb, author = "S. D'Angelo and V. 
V{\"a}lim{\"a}ki", title = "Generalized {Moog} Ladder Filter: {Part II} --- Explicit Nonlinear Model through a Novel Delay-Free Loop Implementation Method", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1873--1883", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2352556", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rafii:2014:CRB, author = "Z. Rafii and Zhiyao Duan and B. Pardo", title = "Combining Rhythm-Based and Pitch-Based Methods for Background and Melody Separation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1884--1893", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2354242", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ramo:2014:HPP, author = "J. R{\"a}m{\"o} and V. V{\"a}lim{\"a}ki and B.
Bank", title = "High-Precision Parallel Graphic Equalizer", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1894--1904", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2354241", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Panagakis:2014:MGC, author = "Y. Panagakis and C. L. Kotropoulos and G. R. Arce", title = "Music Genre Classification via Joint Sparse Low-Rank Representation of Audio Features", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1905--1917", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2355774", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Maezawa:2014:NBD, author = "A. Maezawa and K. Itoyama and K. Yoshii and H. G. 
Okuno", title = "Nonparametric {Bayesian} Dereverberation of Power Spectrograms Based on Infinite-Order Autoregressive Processes", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1918--1930", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2355772", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Krawczyk:2014:SPR, author = "M. Krawczyk and T. Gerkmann", title = "{STFT} Phase Reconstruction in Voiced Speech for an Improved Single-Channel Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1931--1940", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2354236", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Khanagha:2014:DGC, author = "V. Khanagha and K. Daoudi and H. M. 
Yahia", title = "Detection of Glottal Closure Instants Based on the Microcanonical Multiscale Formalism", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1941--1950", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2352451", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Venturini:2014:SFF, author = "A. Venturini and L. Zao and R. Coelho", title = "On speech features fusion, $ \alpha $-integration {Gaussian} modeling and multi-style training for noise robust speaker classification", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1951--1964", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2355821", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Foster:2014:SCD, author = "P. Foster and M. Mauch and S. 
Dixon", title = "Sequential Complexity as a Descriptor for Musical Similarity", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1965--1977", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2357676", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2014:IBE, author = "Gang Liu and J. H. L. Hansen", title = "An Investigation into Back-end Advancements for Speaker Recognition in Multi-Session and Noisy Enrollment Scenarios", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1978--1992", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2352154", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2014:FSC, author = "Jitong Chen and Yuxuan Wang and Deliang Wang", title = "A Feature Study for Classification-Based Speech Separation at Low Signal-to-Noise Ratios", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "1993--2002", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359159", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language 
Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{vanMourik:2014:EHO, author = "J. van Mourik and D. Murphy", title = "Explicit Higher-Order {FDTD} Schemes for {$3$D} Room Acoustic Simulation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2003--2011", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2341913", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yong:2014:EBM, author = "Pei Chee Yong and S. Nordholm and Hai Huyen Dam", title = "Effective Binaural Multi-Channel Processing Algorithm for Improved Environmental Presence", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2012--2024", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359626", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2014:MSA, author = "A. Chen and M. A. 
Hasegawa-Johnson", title = "Mixed Stereo Audio Classification Using a Stereo-Input Mixed-to-Panned Level Feature", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2025--2033", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2359628", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Huang:2014:FMS, author = "Gongping Huang and J. Benesty and Tao Long and Jingdong Chen", title = "A Family of Maximum {SNR} Filters for Noise Reduction", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2034--2047", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2360643", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yan:2014:SLS, author = "Su Yan and Xiaojun Wan", title = "{SRRank}: Leveraging Semantic Roles for Extractive Multi-Document Summarization", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2048--2058", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2360461", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tachibana:2014:HPS, author = "H. Tachibana and N. Ono and H. Kameoka and S. Sagayama", title = "Harmonic\slash Percussive Sound Separation Based on Anisotropic Smoothness of Spectrograms", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2059--2073", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2351131", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gil-Cacho:2014:FDA, author = "J. M. Gil-Cacho and T. van Waterschoot and M. Moonen and S. H. Jensen", title = "A Frequency-Domain Adaptive Filter {(FDAF)} Prediction Error Method {(PEM)} Framework for Double-Talk-Robust Acoustic Echo Cancellation", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2074--2086", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2351614", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2014:ISC, author = "Qi Wang and W. L. Woo and S. S. 
Dlay", title = "Informed Single-Channel Speech Separation Using {HMM--GMM} User-Generated Exemplar Source", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2087--2100", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2357677", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Erro:2014:EIS, author = "D. Erro and T.-C. Zorila and Y. Stylianou", title = "Enhancing the Intelligibility of Statistically Generated Synthetic Speech by Means of Noise-Independent Modifications", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2101--2111", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2361022", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jiang:2014:BCR, author = "Yi Jiang and Deliang Wang and Runsheng Liu and ZhenMing Feng", title = "Binaural Classification for Reverberant Speech Segregation Using Deep Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2112--2121", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2361023", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash 
ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Su:2014:SMM, author = "Li Su and Hsin-Ming Lin and Yi-Hsuan Yang", title = "Sparse Modeling of Magnitude and Phase-Derived Spectra for Playing Technique Classification", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2122--2132", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2362006", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Reddy:2014:USD, author = "V. V. Reddy and A. W. H. Khong and Boon Poh Ng", title = "Unambiguous Speech {DOA} Estimation Under Spatial Aliasing Conditions", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2133--2145", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2344856", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mohammadi:2014:ESA, author = "A. Mohammadi and S. S. Sarfjoo and C. 
Demiroglu", title = "Eigenvoice Speaker Adaptation with Minimal Data for Statistical Speech Synthesis Systems Using a {MAP} Approach and Nearest-Neighbors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2146--2157", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2362009", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Han:2014:NNB, author = "Kun Han and Deliang Wang", title = "Neural Network Based Pitch Tracking in Very Noisy Speech", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2158--2168", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2363410", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mu:2014:MCD, author = "Yongsheng Mu and Peifeng Ji and Wei Ji and Ming Wu and Jun Yang", title = "Modeling and Compensation for the Distortion of Parametric Loudspeakers Using a One-Dimension {Volterra} Filter", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2169--2181", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2363414", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM 
Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Thiergart:2014:IPS, author = "O. Thiergart and M. Taseska and E. A. P. Habets", title = "An Informed Parametric Spatial Filter Based on Instantaneous Direction-of-Arrival Estimates", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2182--2196", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2363407", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Santos:2014:USC, author = "J. F. Santos and T. H. Falk", title = "Updating the {SRMR--CI} Metric for Improved Intelligibility Prediction for Cochlear Implant Users", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2197--2206", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2363788", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kim:2014:DAB, author = "Seon Man Kim and Hong Kook Kim", title = "Direction-of-Arrival Based {SNR} Estimation for Dual-Microphone Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2207--2217", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2360646", ISSN = 
"2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Otsuka:2014:MSS, author = "T. Otsuka and K. Ishiguro and T. Yoshioka and H. Sawada and H. G. Okuno", title = "Multichannel Sound Source Dereverberation and Separation for Arbitrary Number of Sources Based on {Bayesian} Nonparametrics", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2218--2232", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2363790", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Traa:2014:MSS, author = "J. Traa and P. Smaragdis", title = "Multichannel Source Separation and Tracking With {RANSAC} and Directional Statistics", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2233--2243", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2365701", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2014:FMM, author = "Weifeng Li and Longbiao Wang and Yicong Zhou and J. Dines and M. Magimai-Doss and H. 
Bourlard and Qingmin Liao",
  title =        "Feature Mapping of Multiple Beamformed Sources for Robust Overlapping Speech Recognition Using a Microphone Array",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2244--2255",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2014.2364130",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% One-page correction notice; the corrected article is the one cited in
%%% the note field.  The bracketed tag at the end of the title is kept as
%%% plain text with no font commands (presumably month, two-digit year,
%%% and page range of the corrected article --- confirm against the
%%% publisher's listing).  A single page is recorded as one number, like
%%% the other single-page records (C1, C2, ...) in this file.
@Article{FanChiang:2014:CLC,
  author =       "Y. FanChiang and C.-W. Wei and Y.-L. Meng and Y.-W. Lin and S.-J. Jou and T.-S. Chang",
  title =        "Correction to {``Low Complexity Formant Estimation Adaptive Feedback Cancellation for Hearing Aids Using Pitch Based Processing'' [Aug 14 1248--1259]}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2256",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2014.2365971",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  note =         "See \cite{FanChiang:2014:LCF}.",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2014:LR,
  author =       "Anonymous",
  title =        "List of Reviewers",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "2257--2259",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2014.2361536",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATah, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2260--2261", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2373633", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATai, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2262--2263", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2373634", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IIA, author = "Anonymous", title = "2014 Index {IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Vol. 
22", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "2264--2288", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2373645", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:BPh, author = "Anonymous", title = "[{Blank} page]", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "B1686", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2373632", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:FCl, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "22", number = "12", pages = "C1", month = dec, year = "2014", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2373572", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:40 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2014:IATaj, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume 
= "22",
  number =       "12",
  pages =        "C2",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2014.2373574",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2014:ISPl,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "C3",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2014.2373577",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2014:BPBl,
  author =       "Anonymous",
  title =        "[{Blank} page --- back cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "22",
  number =       "12",
  pages =        "C4",
  month =        dec,
  year =         "2014",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2014.2373671",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:40 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:TCa,
  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "1--2",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2392855",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:TCb,
  author =       "Anonymous",
  title =        "Table of contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "3--4",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2392891",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Inaugural editorial in volume 23, number 1 (January 2015).  The
%%% author's given name is abbreviated to an initial, written with a
%%% trailing period like every other abbreviated name in this file.
@Article{Li:2015:IEE,
  author =       "H. Li",
  title =        "Inaugural Editorial: Embracing New Opportunities for Growth",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "5--6",
  month =        jan,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2390431",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:41 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Xu:2015:RAS,
  author =       "Yong Xu and Jun Du and Li-Rong Dai and Chin-Hui Lee",
  title =        "A Regression Approach to Speech Enhancement Based on Deep Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "1",
  pages =        "7--19",
  month =        jan,
  year =         "2015",
CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2364452", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Phan:2015:RRF, author = "H. Phan and M. Maas and R. Mazur and A. Mertins", title = "Random Regression Forests for Acoustic Event Detection and Classification", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "20--31", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2367814", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2015:JPD, author = "Yuntao Wu and L. Amir and J. R. Jensen and Guisheng Liao", title = "Joint Pitch and {DOA} Estimation Using the {ESPRIT} Method", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "32--45", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2367817", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Decorsiere:2015:IAS, author = "R. Decorsiere and P. L. S{\o}ndergaard and E. N. MacDonald and T. 
Dau", title = "Inversion of Auditory Spectrograms, Traditional Spectrograms, and Other Envelope Representations", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "46--56", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2367821", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Poignant:2015:USI, author = "J. Poignant and L. Besacier and G. Qu{\'e}not", title = "Unsupervised Speaker Identification in {TV} Broadcast Based on Written Names", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "57--68", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2367822", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tong:2015:RTF, author = "Renjie Tong and Yingyue Zhou and Long Zhang and Guangzhao Bao and Zhongfu Ye", title = "A Robust Time-Frequency Decomposition Model for Suppression of Mixed {Gaussian}-Impulse Noise in Audio Signals", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "69--79", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2371544", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM 
Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ahani:2015:SRB, author = "S. Ahani and S. Ghaemmaghami and Z. J. Wang", title = "A Sparse Representation-Based Wavelet Domain Speech Steganography Method", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "80--91", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2372313", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/cryptography2010.bib; https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Narayanan:2015:IRD, author = "A. Narayanan and Deliang Wang", title = "Improving Robustness of Deep Neural Network Acoustic Models via Speech Separation and Joint Adaptive Training", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "92--101", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2372314", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Su:2015:ACC, author = "Rongfeng Su and Xunying Liu and Lan Wang", title = "Automatic Complexity Control of Generalized Variable Parameter {HMMs} for Noise Robust Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "102--114", month = jan, year = "2015", CODEN = "????", 
DOI = "https://doi.org/10.1109/TASLP.2014.2372901", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2015:CLA, author = "Zixing Zhang and E. Coutinho and Jun Deng and B. Schuller", title = "Cooperative Learning and its Application to Emotion Recognition from Speech", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "115--126", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2375558", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Su:2015:RDG, author = "Pei-hao Su and Chuan-hsun Wu and Lin-shan Lee", title = "A Recursive Dialogue Game for Personalized Computer-Aided Pronunciation Training", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "127--141", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2375572", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rakotomamonjy:2015:HGT, author = "A. Rakotomamonjy and G. 
Gasso", title = "Histogram of Gradients of Time--Frequency Representations for Audio Scene Classification", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "142--153", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2375575", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Khoubrouy:2015:HDH, author = "S. A. Khoubrouy and I. M. S. Panahi and J. H. L. Hansen", title = "Howling Detection in Hearing Aids Based on Generalized {Teager--Kaiser} Operator", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "154--161", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2377575", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nielsen:2015:PBP, author = "J. B. B. Nielsen and J. Nielsen and J. 
Larsen", title = "Perception-Based Personalization of Hearing Aids Using {Gaussian} Processes and Active Learning", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "162--173", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2377581", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jensen:2015:JST, author = "J. R. Jensen and M. G. Christensen and J. Benesty and S. H. Jensen", title = "Joint Spatio-Temporal Filtering Methods for {DOA} and Fundamental Frequency Estimation", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "174--185", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2377583", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jensen:2015:MMS, author = "J. 
Jensen and Zheng-Hua Tan", title = "Minimum Mean-Square Error Estimation of Mel-Frequency Cepstral Features --- A Theoretically Consistent Approach", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "186--197", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2377591", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Martinez-Hinarejos:2015:UDA, author = "C.-D. Mart{\'\i}nez-Hinarejos and J.-M. Bened{\'\i} and V. Tamarit", title = "Unsegmented Dialogue Act Annotation and Decoding With {$N$}-Gram Transducers", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "198--211", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2377595", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2015:NHD, author = "Lin Wang and Zhe Chen and Fuliang Yin", title = "A Novel Hierarchical Decomposition Vector Quantization Method for High-Order {LPC} Parameters", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "212--221", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2380352", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal =
"IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:BPa, author = "Anonymous", title = "[{Blank} page]", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "222--222", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394019", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IATa, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "223--224", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394012", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IAa, author = "Anonymous", title = "Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "225--226", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394191", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, 
Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:OAa, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "227--227", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394018", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:FCa, author = "Anonymous", title = "[{Front} cover]", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "C1", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2393513", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IATb, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "C2", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394171", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:ISPa, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "C3", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394022", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:BPBa, author = "Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "23", number = "1", pages = "C4", month = jan, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394026", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:41 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:TCc, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "223--224", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2393691", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:TCd, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "225--226", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2393693", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hua:2015:TSE, author = "Guang Hua and J. Goh and V. L. L. Thing", title = "Time-Spread Echo-Based Audio Watermarking With Optimized Imperceptibility and Robustness", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "227--239", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2387385", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schwartz:2015:MMS, author = "O. Schwartz and S. Gannot and E. A. P. 
Habets", title = "Multi-Microphone Speech Dereverberation and Noise Reduction Using Relative Early Transfer Functions", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "240--251", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2372335", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Molina:2015:SST, author = "E. Molina and L. J. Tard{\'o}n and A. M. Barbancho and I. Barbancho", title = "{SiPTH}: Singing Transcription Based on Hysteresis Defined on the Pitch-Time Curve", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "252--263", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2331102", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2015:ASM, author = "Haipeng Wang and Tan Lee and Cheung-Chi Leung and Bin Ma and Haizhou Li", title = "Acoustic Segment Modeling with Spectral Clustering Methods", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "264--277", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2387382", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio,
Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Arora:2015:MFE, author = "V. Arora and L. Behera", title = "Multiple {F0} Estimation and Source Clustering of Polyphonic Music Audio Using {PLCA} and {HMRFs}", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "278--287", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2387388", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sugiura:2015:RWS, author = "R. Sugiura and Y. Kamamoto and N. Harada and H. Kameoka and T. Moriya", title = "Resolution Warped Spectral Representation for Low-Delay and Low-Bit-Rate Audio {Coder}", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "288--299", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2384279", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Weng:2015:DTU, author = "Chao Weng and B.-H. F. 
Juang", title = "Discriminative Training Using Non-Uniform Criteria for Keyword Spotting on Spontaneous Speech", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "300--312", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2381931", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Matsuyama:2015:AEO, author = "Y. Matsuyama and A. Saito and S. Fujie and T. Kobayashi", title = "Automatic Expressive Opinion Sentence Generation for Enjoyable Conversational Systems", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "313--326", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2363589", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Petkov:2015:SDR, author = "P. N. Petkov and W. B. 
Kleijn", title = "Spectral Dynamics Recovery for Enhanced Speech Intelligibility in Noise", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "327--338", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2384271", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bicici:2015:OIS, author = "E. Bi{\c{c}}ici and D. Yuret", title = "Optimizing Instance Selection for Statistical Machine Translation with Feature Decay Algorithms", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "339--350", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2381882", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2015:EDF, author = "Mengqiu Zhang and R. A. Kennedy and T. D.
Abhayapala", title = "Empirical Determination of Frequency Representation in Spherical Harmonics-Based {HRTF} Functional Modeling", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "351--360", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2381881", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Feng:2015:TGS, author = "Zu-Ren Feng and Qing Zhou and Jun Zhang and Ping Jiang and Xue-Wen Yang", title = "A Target Guided Subband Filter for Acoustic Event Detection in Noisy Environments Using Wavelet Packets", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "361--372", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2381871", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hirayama:2015:ASR, author = "N. Hirayama and K. Yoshino and K. Itoyama and S. Mori and H. G. 
Okuno", title = "Automatic Speech Recognition for Mixed Dialect Utterances by Mixing Dialect Language Models", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "373--382", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2387414", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schasse:2015:TSF, author = "A. Schasse and T. Gerkmann and R. Martin and W. S{\"o}rgel and T. Pilgrim and H. Puder", title = "Two-Stage Filter-Bank System for Improved Single-Channel Noise Reduction in Hearing Aids", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "383--393", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2365992", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schwartz:2015:OSD, author = "B. Schwartz and S. Gannot and E. A. P.
Habets", title = "Online Speech Dereverberation Using {Kalman} Filter and {EM} Algorithm", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "394--406", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2372342", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gerazov:2015:KPF, author = "B. Gerazov and Z. Ivanovski", title = "Kernel Power Flow Orientation Coefficients for Noise-Robust Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "407--419", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2384274", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IATc, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "420--421", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394014", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IAb, author = "Anonymous", title = "Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "422--423", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394192", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:OAb, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "424--424", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394016", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:FCb, author = "Anonymous", title = "[{Front} cover]", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "C1", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2393998", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IATd, author = 
"Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "C2", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394172", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:ISPb, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "C3", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394023", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:BPBb, author = "Anonymous", title = "[{Blank} page --- back cover]", journal = j-IEEE-ACM-TASLP, volume = "23", number = "2", pages = "C4", month = feb, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2394025", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:TCe, author = 
"Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "23", number = "3", pages = "425--426", month = mar, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2408218", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2015:ISS, author = "H. Li and M. Federico and X. He and H. Meng and I. Trancoso", title = "Introduction to the Special Section on Continuous Space and Related Methods in Natural Language Processing", journal = j-IEEE-ACM-TASLP, volume = "23", number = "3", pages = "427--430", month = mar, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2405131", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Adel:2015:SSF, author = "H. Adel and Ngoc Thang Vu and K. Kirchhoff and D. Telaar and T. 
Schultz", title = "Syntactic and Semantic Features For Code-Switching Factored Language Models", journal = j-IEEE-ACM-TASLP, volume = "23", number = "3", pages = "431--440", month = mar, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2389622", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zeng:2015:GBL, author = "Xiaodong Zeng and D. F. Wong and L. S. Chao and I. Trancoso", title = "Graph-Based Lexicon Regularization for {PCFG} With Latent Annotations", journal = j-IEEE-ACM-TASLP, volume = "23", number = "3", pages = "441--450", month = mar, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2389034", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2015:DFR, author = "Wenliang Chen and Min Zhang and Yue Zhang", title = "Distributed Feature Representations for Dependency Parsing", journal = j-IEEE-ACM-TASLP, volume = "23", number = "3", pages = "451--460", month = mar, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2365359", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fu:2015:LSH, author = "Ruiji Fu and Jiang Guo and Bing Qin and Wanxiang Che and Haifeng Wang and Ting Liu", title = "Learning Semantic Hierarchies: a Continuous Vector Space Approach", journal = j-IEEE-ACM-TASLP, volume = "23", number = "3", pages = "461--471", month = mar, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2377580", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Banchs:2015:AFM, author = "R. E. Banchs and L. F. D'Haro and Haizhou Li", title = "Adequacy--Fluency Metrics: Evaluating {MT} in the Continuous Space Model Framework", journal = j-IEEE-ACM-TASLP, volume = "23", number = "3", pages = "472--482", month = mar, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2405751", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xiong:2015:TBC, author = "Deyi Xiong and Min Zhang and Xing Wang", title = "Topic-Based Coherence Modeling for Statistical Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "23", number = "3", pages = "483--493", month = mar, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2395254", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hutchinson:2015:SPL, author = "B. Hutchinson and M. Ostendorf and M. Fazel", title = "A Sparse Plus Low-Rank Exponential Language Model for Limited Resource Scenarios", journal = j-IEEE-ACM-TASLP, volume = "23", number = "3", pages = "494--504", month = mar, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2379593", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rashwan:2015:DLF, author = "M. A. A. Rashwan and A. A. {Al Sallab} and H. M. Raafat and A. Rafea", title = "Deep Learning Framework with Confused Sub-Set Resolution Architecture for Automatic {Arabic} Diacritization", journal = j-IEEE-ACM-TASLP, volume = "23", number = "3", pages = "505--516", month = mar, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2395255", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sundermeyer:2015:FRL, author = "M. Sundermeyer and H. Ney and R. 
Schluter", title = "From Feedforward to Recurrent {LSTM} Neural Networks for Language Modeling", journal = j-IEEE-ACM-TASLP, volume = "23", number = "3", pages = "517--529", month = mar, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2400218", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mesnil:2015:URN, author = "G. Mesnil and Y. Dauphin and Kaisheng Yao and Y. Bengio and Li Deng and D. Hakkani-Tur and Xiaodong He and L. Heck and G. Tur and Dong Yu and G. Zweig", title = "Using Recurrent Neural Networks for Slot Filling in Spoken Language Understanding", journal = j-IEEE-ACM-TASLP, volume = "23", number = "3", pages = "530--539", month = mar, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2383614", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:42 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{McLoughlin:2015:RSE, author = "I. 
McLoughlin and Haomin Zhang and Zhipeng Xie and Yan Song and Wei Xiao",
  title =        "Robust Sound Event Classification Using Deep Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "540--552",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2389618",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zahoransky:2015:TSS,
  author =       "D. Zahoransky and I. Polasek",
  title =        "Text Search of Surnames in Some {Slavic} and Other Morphologically Rich Languages Using Rule Based Phonetic Algorithms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "553--563",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2393393",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2015:SDU,
  author =       "Yow-Bang Wang and Lin-shan Lee",
  title =        "Supervised Detection and Unsupervised Discovery of Pronunciation Error Patterns for Computer-Assisted Language Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "564--579",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2014.2387413",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Nakashika:2015:VCU,
  author =       "T. Nakashika and T. Takiguchi and Y. Ariki",
  title =        "Voice Conversion Using {RNN} Pre-Trained by Recurrent Temporal Restricted {Boltzmann} Machines",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "580--587",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2014.2379589",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Obin:2015:SMP,
  author =       "N. Obin and P. Lanchantin",
  title =        "Symbolic Modeling of Prosody: From Linguistics to Statistics",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "588--599",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2014.2387389",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:IATe,
  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "601--602",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415973",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5
06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:IAc,
  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "603--604",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415974",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:IMDa,
  author =       "Anonymous",
  title =        "{IEEE} Member Digital Library",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "606--606",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415994",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:BPc,
  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "B600",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415459",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:FCc,
  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "C1",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2394831",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:IATf,
  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "C2",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415971",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:ISPc,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "C3",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415972",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement =
ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:BPd,
  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "3",
  pages =        "C4",
  month =        mar,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415991",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:42 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:TCf,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "601--602",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2414111",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:TCg,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "603--604",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2414112",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Chen:2015:SEF,
  author =       "Langzhou Chen and N. Braunschweiler and M. J. F. Gales",
  title =        "Speaker and Expression Factorization for Audiobook Data: Expressiveness and Transplantation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "605--618",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2014.2385478",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhou:2015:COT,
  author =       "Xinjie Zhou and Xiaojun Wan and Jianguo Xiao",
  title =        "{CLOpinionMiner}: Opinion Target Extraction in a Cross-Language Scenario",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "619--630",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2392381",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhou:2015:SCB,
  author =       "Pan Zhou and Hui Jiang and Li-Rong Dai and Yu Hu and Qing-Feng Liu",
  title =        "State-Clustering Based Multiple Deep Neural Networks Modeling Approach for Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "631--642",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2392944",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon
Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Hu:2015:SSV,
  author =       "Ying Hu and Guizhong Liu",
  title =        "Separation of Singing Voice Using Nonnegative Matrix Partial Co-Factorization for Singer Identification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "643--653",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2396681",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Kitamura:2015:MSS,
  author =       "D. Kitamura and H. Saruwatari and H. Kameoka and Yu Takahashi and K. Kondo and S. Nakamura",
  title =        "Multichannel Signal Separation Combining Directional Clustering and Nonnegative Matrix Factorization with Spectrogram Restoration",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "654--669",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2401425",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Mai:2015:REN,
  author =       "Van-Khanh Mai and D. Pastor and A. Aissa-El-Bey and R.
Le-Bidan",
  title =        "Robust Estimation of Non-Stationary Noise Power Spectrum for Speech Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "670--682",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2401426",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Blanco:2015:SLB,
  author =       "E. Blanco and D. Moldovan",
  title =        "A Semantic Logic-Based Approach to Determine Textual Similarity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "683--693",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2403613",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Kim:2015:AIA,
  author =       "Myung Jong Kim and Younggwan Kim and Hoirin Kim",
  title =        "Automatic Intelligibility Assessment of Dysarthric Speech Using Phonologically-Structured Sparse Linear Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "694--704",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2403619",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Aneeja:2015:SFF,
  author =       "G. Aneeja and B. Yegnanarayana",
  title =        "Single Frequency Filtering Approach for Discriminating Speech and Nonspeech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "705--717",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2404035",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Deleforge:2015:CLA,
  author =       "A. Deleforge and R. Horaud and Y. Y. Schechner and L. Girin",
  title =        "Co-Localization of Audio Sources in Images Using Binaural Features and Locally-Linear Regression",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "718--731",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2405475",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Dov:2015:AVV,
  author =       "D. Dov and R. Talmon and I.
Cohen",
  title =        "Audio-Visual Voice Activity Detection Using Diffusion Maps",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "732--745",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2405481",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Habibi:2015:KEC,
  author =       "M. Habibi and A. Popescu-Belis",
  title =        "Keyword Extraction and Clustering for Document Recommendation in Conversations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "746--759",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2405482",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Mamun:2015:PSI,
  author =       "N. Mamun and W. A. Jassim and M. S. A.
Zilany",
  title =        "Prediction of Speech Intelligibility Using a Neurogram Orthogonal Polynomial Measure {(NOPM)}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "760--773",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2401513",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{DeSena:2015:MRG,
  author =       "E. {De Sena} and N. Antonello and M. Moonen and T. van Waterschoot",
  title =        "On the Modeling of Rectangular Geometries in Room Acoustic Simulations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "774--786",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2405476",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Huang:2015:MFS,
  author =       "Hao Huang and Haihua Xu and Xianhui Wang and W.
Silamu",
  title =        "Maximum {F1}-Score Discriminative Training Criterion for Automatic Mispronunciation Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "787--797",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2409733",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2015:IQS,
  author =       "Chung-Che Wang and J.-S. R. Jang",
  title =        "Improving Query-by-Singing\slash Humming by Combining Melody and Lyric Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "798--806",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2409735",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:IATg,
  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "807--808",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415917",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:IAd,
  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "809--810",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415918",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:IMDb,
  author =       "Anonymous",
  title =        "{IEEE} Member Digital Library",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "812--812",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415992",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:FCd,
  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "C1",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415914",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}
@Article{Anonymous:2015:IATh,
  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "C2",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415915",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:ISPd,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "C3",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415916",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:BPe,
  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "4",
  pages =        "C4",
  month =        apr,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2415975",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}
%%% Volume 23, number 5 (May 2015)

@Article{Anonymous:2015:TCh,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "813--814",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2425738",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:TCi,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "815--816",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2425751",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Krebs:2015:IMS,
  author =       "F. Krebs and A. Holzapfel and A. T. Cemgil and G. Widmer",
  title =        "Inferring Metrical Structure in Music Using Particle Filters",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "817--827",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2409737",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Cho:2015:UCB,
  author =       "Janghoon Cho and C. D. Yoo",
  title =        "Underdetermined Convolutive {BSS}: {Bayes} Risk Minimization Based on a Mixture of Super-{Gaussian} Posterior Approximation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "828--839",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2409778",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% NOTE(review): "Bass" in the next title appears to be the common noun
%%% (low-frequency audio), not a personal name, so it is intentionally
%%% left unbraced and bibliography styles are free to downcase it.

@Article{Mu:2015:OAM,
  author =       "Hao Mu and Woon-Seng Gan and Ee-Leng Tan",
  title =        "An Objective Analysis Method for Perceptual Quality of a Virtual Bass System",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "840--850",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2409779",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Hendriks:2015:ONE,
  author =       "R. C. Hendriks and J. B. Crespo and J. Jensen and C. H. Taal",
  title =        "Optimal Near-End Speech Intelligibility Improvement Incorporating Additive Noise and Late Reverberation Under an Approximation of the Short-Time {SII}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "851--862",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2409780",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Abdelaziz:2015:LDS,
  author =       "A. H. Abdelaziz and S. Zeiler and D. Kolossa",
  title =        "Learning Dynamic Stream Weights For Coupled-{HMM}-Based Audio-Visual Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "863--876",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2409785",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Berkun:2015:CBR,
  author =       "R. Berkun and I. Cohen and J. Benesty",
  title =        "Combined Beamformers for Robust Broadband Regularized Superdirective Beamforming",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "877--886",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2410139",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Breebaart:2015:ESI,
  author =       "J. Breebaart",
  title =        "Evaluation of Statistical Inference Tests Applied to Subjective Audio Quality Data With Small Sample Size",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "887--897",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2412462",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zivanovic:2015:HBC,
  author =       "M. Zivanovi{\'c}",
  title =        "Harmonic Bandwidth Companding for Separation of Overlapping Harmonics in Pitched Signals",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "898--908",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2412464",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Chien:2015:LGS,
  author =       "Jen-Tzung Chien",
  title =        "{Laplace} Group Sensing for Acoustic Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "909--922",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2412466",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wei:2015:DLC,
  author =       "Ying Wei and Yinfeng Wang",
  title =        "Design of Low Complexity Adjustable Filter Bank for Personalized Hearing Aid Solutions",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "923--931",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2409774",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Perez-Carrillo:2015:IAV,
  author =       "A. Perez-Carrillo and M. M. Wanderley",
  title =        "Indirect Acquisition of Violin Instrumental Controls from Audio Signal with Hidden {Markov} Models",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "932--940",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2410140",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Mansikkaniemi:2015:AMB,
  author =       "A. Mansikkaniemi and M. Kurimo",
  title =        "Adaptation of Morph-Based Speech Recognition for Foreign Names and Acronyms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "941--950",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2414818",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:IATi,
  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "953--954",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2436492",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:IAe,
  author =       "Anonymous",
  title =        "Information for Authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "955--956",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2436493",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:OAc,
  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "957--957",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2436532",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:BPf,
  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "B951--B952",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2436491",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:FCe,
  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "C1",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2426093",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:IATj,
  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "C2",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2436451",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:ISPe,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "C3",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2436531",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:BPg,
  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "5",
  pages =        "C4",
  month =        may,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2436552",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:43 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 23, number 6 (June 2015)

@Article{Anonymous:2015:TCj,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "953--954",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2434312",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:TCk,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "23",
  number =       "6",
  pages =        "955--956",
  month =        jun,
  year =         "2015",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2015.2434313",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Mon Oct 5 06:29:44 MDT 2015",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}
@Article{Liu:2015:CRL, author = "Shih-Hung Liu and Kuan-Yu Chen and B. Chen and Hsin-Min Wang and Hsu-Chun Yen and Wen-Lian Hsu", title = "Combining Relevance Language Modeling and Clarity Measure for Extractive Speech Summarization", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "957--969", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2414820", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Niedzwiecki:2015:EID, author = "M. Niedzwiecki and M. Ciolek and K. Cisowski", title = "Elimination of Impulsive Disturbances From Stereo Audio Recordings Using Vector Autoregressive Modeling and Variable-order {Kalman} Filtering", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "970--981", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2414823", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Han:2015:LSM, author = "Kun Han and Yuxuan Wang and Deliang Wang and W. S. Woods and I. 
Merks and Tao Zhang", title = "Learning Spectral Mapping for Speech Dereverberation and Denoising", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "982--992", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2416653", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Foster:2015:ICS, author = "P. Foster and S. Dixon and A. Klapuri", title = "Identifying Cover Songs Using Information-Theoretic Measures of Similarity", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "993--1005", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2416655", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schwarz:2015:CDP, author = "A. Schwarz and W. 
Kellermann", title = "Coherent-to-Diffuse Power Ratio Estimation for Dereverberation", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "1006--1018", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2418571", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cernak:2015:ISC, author = "M. Cernak and P. N. Garner and A. Lazaridis and P. Motlicek and Xingyu Na", title = "Incremental Syllable-Context Phonetic Vocoding", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "1019--1030", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2418577", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rouvier:2015:ABV, author = "M. Rouvier and S. Oger and G. Linares and D. Matrouf and B. Merialdo and Y. 
Li", title = "Audio-Based Video Genre Identification", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "1031--1041", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2014.2387411", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kameoka:2015:GMV, author = "H. Kameoka and K. Yoshizato and T. Ishihara and K. Kadowaki and Y. Ohishi and K. Kashino", title = "Generative Modeling of Voice Fundamental Frequency Contours", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "1042--1053", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2418576", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Markovic:2015:MSI, author = "Dejan Markovi{\'c} and Fabio Antonacci and Augusto Sarti and Stefano Tubaro", title = "Multiview Soundfield Imaging in the Projective Ray Space", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "1054--1067", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2419076", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bates:2015:NSS, author = "A. P. Bates and Z. Khalid and R. A. Kennedy", title = "Novel Sampling Scheme on the Sphere for Head-Related Transfer Function Measurements", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "1068--1081", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2419971", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jia:2015:EMA, author = "Maoshen Jia and Ziyu Yang and Changchun Bao and Xiguang Zheng and C. Ritz", title = "Encoding Multiple Audio Objects Using Intra-Object Sparsity", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "1082--1095", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2419980", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IATk, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "1096--1097", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2436471", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IAf, author = "Anonymous", title = "Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "1098--1099", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2436472", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:OAd, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "1100--1100", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2436512", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:FCf, author = "Anonymous", title = "[{Front} cover]", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "C1", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2434971", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash 
ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IATl, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "C2", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2436452", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:ISPf, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "C3", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2436511", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:BPh, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "23", number = "6", pages = "C4", month = jun, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2436551", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on 
Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:TCl, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1101--1102", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2449111", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:TCm, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1103--1104", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2449131", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{McVicar:2015:ACA, author = "M. McVicar and S. Fukayama and M. 
Goto", title = "{AutoGuitarTab}: Computer-Aided Composition of Rhythm and Lead Guitar Parts in the Tablature Space", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1105--1117", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2419976", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{VanSegbroeck:2015:RLI, author = "M. {Van Segbroeck} and R. Travadi and S. S. Narayanan", title = "Rapid Language Identification", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1118--1129", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2419978", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Marelli:2015:EAH, author = "D. Marelli and R. Baumgartner and P. 
Majdak", title = "Efficient Approximation of Head-Related Transfer Functions in Subbands for Accurate Sound Localization", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1130--1143", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2425219", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yeh:2015:IFR, author = "Ching-Feng Yeh and Lin-shan Lee", title = "An Improved Framework for Recognizing Highly Imbalanced Bilingual Code-Switched Lectures with Cross-Language Acoustic Modeling and Frame-Level Language Identification", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1144--1159", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2425214", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Basaran:2015:PMB, author = "D. Basaran and A. T. Cemgil and E. 
Anarim", title = "A Probabilistic Model-Based Approach for Aligning Multiple Audio Sequences", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1160--1171", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2419972", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2015:MLD, author = "Dongpeng Chen and B. K.-W. Mak", title = "Multitask Learning of Deep Neural Networks for Low-Resource Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1172--1183", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2422573", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Meyer:2015:DDC, author = "T. Meyer and N. Hajlaoui and A. 
Popescu-Belis", title = "Disambiguating Discourse Connectives for Statistical Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1184--1197", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2422576", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Remes:2015:BCM, author = "U. Remes and A. {Ramirez Lopez} and K. Palomaki and M. Kurimo", title = "Bounded Conditional Mean Imputation with Observation Uncertainties and Acoustic Model Adaptation", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1198--1208", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2424322", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2015:BCS, author = "Rui Wang and Hai Zhao and Bao-Liang Lu and M. Utiyama and E. 
Sumita", title = "Bilingual Continuous-Space Language Model Growing for Statistical Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1209--1220", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2425220", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chong:2015:DWP, author = "Tze Yuang Chong and R. E. Banchs and Eng Siong Chng and Haizhou Li", title = "Decoupling Word-Pair Distance and Co-occurrence Information for Effective Long History Context Language Modeling", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1221--1232", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2425223", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sun:2015:SEU, author = "Meng Sun and Yinan Li and J. F. 
Gemmeke and Xiongwei Zhang", title = "Speech Enhancement Under Low {SNR} Conditions Via Noise Estimation Using Sparse and Low-Rank {NMF} with {Kullback--Leibler} Divergence", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1233--1242", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2427520", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IATm, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1245--1246", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2458048", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IAg, author = "Anonymous", title = "Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "1247--1248", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2458049", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:BPi, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "B1243--B1244", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2455911", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:FCg, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "C1", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2438272", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IATn, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "C2", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2458031", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:ISPg, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "C3", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2458046", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:BPj, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "23", number = "7", pages = "C4", month = jul, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2458047", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:44 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:TCn, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1245--1246", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2456451", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
@Article{Anonymous:2015:TCo, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1247--1248", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2456473", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Momeni:2015:JDE, author = "H. Momeni and H. R. Abutalebi and A. Tadaion", title = "Joint Detection and Estimation of Speech Spectral Amplitude Using Noncontinuous Gain Functions", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1249--1258", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2427522", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chien:2015:HPY, author = "Jen-Tzung Chien", title = "Hierarchical {Pitman--Yor--Dirichlet} Language Model", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1259--1272", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2428632", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fallahpour:2015:AWB, author = "M. Fallahpour and D. Megias", title = "Audio Watermarking Based on {Fibonacci} Numbers", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1273--1282", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2430818", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mowlaee:2015:PES, author = "P. Mowlaee and J. Kulmer", title = "Phase Estimation in Single-Channel Speech Enhancement: Limits-Potential", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1283--1294", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2430820", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Morchid:2015:CMR, author = "M. Morchid and M. Bouallegue and R. Dufour and G. Linares and D. Matrouf and R. 
{De Mori}", title = "Compact Multiview Representation of Documents Based on the Total Variability Space", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1295--1308", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2431854", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sugiura:2015:OCG, author = "R. Sugiura and Y. Kamamoto and N. Harada and H. Kameoka and T. Moriya", title = "Optimal Coding of Generalized-{Gaussian}-Distributed Frequency Spectra for Low-Delay Audio Coder With Powered All-Pole Spectrum Estimation", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1309--1321", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2431851", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2015:EBN, author = "Kuan-Yu Chen and Shih-Hung Liu and B. 
Chen and Hsin-Min Wang and Ea-Ee Jan and Wen-Lian Hsu and Hsin-Hsi Chen", title = "Extractive Broadcast News Summarization Leveraging Recurrent Neural Network Language Modeling Techniques", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1322--1334", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2432578", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Koldovsky:2015:SSS, author = "Z. Koldovsky and J. Malek and S. Gannot", title = "Spatial Source Subtraction Based on Incomplete Measurements of Relative Transfer Function", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1335--1347", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2425213", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Dimitriadis:2015:UMM, author = "D. Dimitriadis and E. 
Bocchieri", title = "Use of Micro-Modulation Features in Large Vocabulary Continuous Speech Recognition Tasks", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1348--1357", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2430815", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2015:SBT, author = "Xun Wang and Y. Yoshida and T. Hirao and M. Nagata and K. Sudoh", title = "Summarization Based on Task-Oriented Discourse Parsing", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1358--1367", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2432573", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Spa:2015:GIE, author = "C. Spa and A. Rey and E. 
Hernandez", title = "A {GPU} Implementation of an Explicit Compact {FDTD} Algorithm with a Digital Impedance Filter for Room Acoustics Applications", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1368--1380", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2434212", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IATo, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1381--1382", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2456642", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IAh, author = "Anonymous", title = "Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "1383--1384", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2456643", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:FCh, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "C1", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2458092", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IATp, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "C2", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2458032", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:ISPh, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "C3", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2458045", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:BPk, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "23", number = "8", pages = "C4", month = aug, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2458431", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:TCp, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1385--1386", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2471806", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:TCq, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1387--1388", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2471875", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lee:2015:SCR, author = "Lin-shan Lee 
and J. Glass and Hung-yi Lee and Chun-an Chan", title = "Spoken Content Retrieval --- Beyond Cascading Speech Recognition with Text Retrieval", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1389--1420", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2438543", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jiao:2015:CWC, author = "Yishan Jiao and V. Berisha and Ming Tu and J. Liss", title = "Convex Weighting Criteria for Speaking Rate Estimation", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1421--1430", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2434213", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{He:2015:PAE, author = "Jianjun He and Woon-Seng Gan and Ee-Leng Tan", title = "Primary-Ambient Extraction Using Ambient Spectrum Estimation for Immersive Spatial Audio Reproduction", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1431--1444", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2434272", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", note = "See comments \cite{Lu:2024:CXP}", acknowledgement = ack-nhfb, 
fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shen:2015:LCD, author = "Qing Shen and Wei Liu and Wei Cui and Siliang Wu and Y. D. Zhang and M. G. Amin", title = "Low-Complexity Direction-of-Arrival Estimation Based on Wideband Co-Prime Arrays", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1445--1456", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2436214", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chien:2015:APM, author = "Yu-Ren Chien and Hsin-Min Wang and Shyh-Kang Jeng", title = "An Acoustic-Phonetic Model of {F0} Likelihood for Vocal Melody Extraction", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1457--1468", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2436345", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cui:2015:DAD, author = "Xiaodong Cui and V. Goel and B. 
Kingsbury", title = "Data Augmentation for Deep Neural Network Acoustic Modeling", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1469--1477", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2438544", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{DeSena:2015:ESR, author = "E. {De Sena} and H. Hac{\i}habibo{\u{g}}lu and Z. Cvetkovi{\'c} and J. O. Smith", title = "Efficient Synthesis of Room Acoustics via Scattering Delay Networks", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1478--1492", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2438547", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2015:NPS, author = "Lin Wang and T. Gerkmann and S. 
Doclo", title = "Noise Power Spectral Density Estimation Using {MaxNSR} Blocking Matrix", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1493--1508", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2438542", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jukic:2015:MCL, author = "A. Jukic and T. van Waterschoot and T. Gerkmann and S. Doclo", title = "Multi-Channel Linear Prediction-Based Speech Dereverberation With Sparse Priors", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1509--1520", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2438549", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mowlaee:2015:HPE, author = "P. Mowlaee and J. 
Kulmer", title = "Harmonic Phase Estimation in Single-Channel Speech Enhancement Using Phase Decomposition and {SNR} Information", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1521--1532", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2439038", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IATq, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1535--1536", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479177", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:IAi, author = "Anonymous", title = "Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1537--1538", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479178", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:HCYa, author = "Anonymous", title = "How can you get your idea to market first?", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "1539--1539", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479184", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:BPl, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "B1533--B1534", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479179", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:FCi, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "23", number = "9", pages = "C1", month = sep, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2446545", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:45 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
%%% Volume 23, number 9 (September 2015): cover pages C2--C4.

@Article{Anonymous:2015:IATr,
  author          = "Anonymous",
  title           = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "9",
  pages           = "C2",
  month           = sep,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2478021",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:45 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:ISPi,
  author          = "Anonymous",
  title           = "{IEEE Signal Processing Society} Information",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "9",
  pages           = "C3",
  month           = sep,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2479182",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:45 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:BPm,
  author          = "Anonymous",
  title           = "Blank page",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "9",
  pages           = "C4",
  month           = sep,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2479186",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:45 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}
%%% Volume 23, number 10 (October 2015): tables of contents.

@Article{Anonymous:2015:TCr,
  author          = "Anonymous",
  title           = "Table of Contents",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1535--1536",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2479047",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:TCs,
  author          = "Anonymous",
  title           = "Table of Contents",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1537--1538",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2479057",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 23, number 10 (October 2015): research articles, in page order.

@Article{Tervo:2015:DAE,
  author          = "S. Tervo and A. Politis",
  title           = "Direction of Arrival Estimation of Reflections from Room Impulse Responses Using a Spherical Microphone Array",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1539--1551",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2439573",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2015:SEV,
  author          = "Jia-Ching Wang and Yu-Hao Chin and Bo-Wei Chen and Chang-Hong Lin and Chung-Hsien Wu",
  title           = "Speech Emotion Verification Using Emotion Variance Modeling and Discriminant Scale-Frequency Maps",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1552--1562",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2438535",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Canclini:2015:RLC,
  author          = "A. Canclini and P. Bestagini and F. Antonacci and M. Compagnoni and A. Sarti and S. Tubaro",
  title           = "A Robust and Low-Complexity Source Localization Algorithm for Asynchronous Distributed Microphone Networks",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1563--1575",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2439040",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{He:2015:TSB,
  author          = "Jianjun He and Woon-Seng Gan and Ee-Leng Tan",
  title           = "Time-Shifting Based Primary-Ambient Extraction for Spatial Audio Reproduction",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1576--1588",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2439577",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Shah:2015:NAE,
  author          = "P. Shah and I. Lewis and S. Grant and S. Angrignon",
  title           = "Nonlinear Acoustic Echo Cancellation Using Voltage and Current Feedback",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1589--1599",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2425955",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Su:2015:CST,
  author          = "Li Su and Yi-Hsuan Yang",
  title           = "Combining Spectral and Temporal Representations for Multipitch Estimation of Polyphonic Music",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1600--1612",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2442411",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Fujioka:2015:HPH,
  author          = "T. Fujioka and Y. Nagata and M. Abe",
  title           = "High-Precision Harmonic Distortion Level Measurement of a Loudspeaker Using Adaptive Filters in a Noisy Environment",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1613--1622",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2442415",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Hon:2015:AFM,
  author          = "Tsz-Kin Hon and Lin Wang and J. D. Reiss and A. Cavallaro",
  title           = "Audio Fingerprinting for Multi-Device Self-Localization",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1623--1636",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2442417",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Tian:2015:DIU,
  author          = "Ye Tian and Zhe Chen and Fuliang Yin",
  title           = "Distributed {IMM}-Unscented {Kalman} Filter for Speaker Tracking in Microphone Array Networks",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1637--1647",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2442418",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Li:2015:SIP,
  author          = "Na Li and Man-Wai Mak",
  title           = "{SNR}-Invariant {PLDA} Modeling in Nonparametric Subspace for Robust Speaker Verification",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1648--1659",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2442757",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Vilkamo:2015:PRS,
  author          = "J. Vilkamo and S. Delikaris-Manias",
  title           = "Perceptual Reproduction of Spatial Sound Using Loudspeaker-Signal-Domain Parametrization",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1660--1669",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2443977",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Weng:2015:DNN,
  author          = "Chao Weng and Dong Yu and M. L. Seltzer and J. Droppo",
  title           = "Deep Neural Networks for Single-Channel Multi-Talker Speech Recognition",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1670--1679",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2444659",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ruhland:2015:RGS,
  author          = "M. Ruhland and J. Bitzer and M. Brandt and S. Goetze",
  title           = "Reduction of {Gaussian}, Supergaussian, and Impulsive Noise by Interpolation of the Binary Mask Residual",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1680--1691",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2444664",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Dorfan:2015:TBR,
  author          = "Y. Dorfan and S. Gannot",
  title           = "Tree-Based Recursive Expectation-Maximization Algorithm for Localization of Acoustic Sources",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1692--1703",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2444654",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 23, number 10 (October 2015): unsigned back matter and
%%% cover pages C1--C2.

@Article{Anonymous:2015:IATs,
  author          = "Anonymous",
  title           = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing EDICS}",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1704--1705",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2479175",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:IAj,
  author          = "Anonymous",
  title           = "Information for Authors",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1706--1707",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2479176",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:HCYb,
  author          = "Anonymous",
  title           = "How can you get your idea to market first?",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "1708--1708",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2479183",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:FCj,
  author          = "Anonymous",
  title           = "Front Cover",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "C1",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2479187",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:IATt,
  author          = "Anonymous",
  title           = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "C2",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2479180",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}
%%% Volume 23, number 10 (October 2015): cover pages C3--C4.

@Article{Anonymous:2015:ISPj,
  author          = "Anonymous",
  title           = "{IEEE Signal Processing Society} Information",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "C3",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2479181",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2015:BPn,
  author          = "Anonymous",
  title           = "Blank page",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "10",
  pages           = "C4",
  month           = oct,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2479185",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 23, number 11 (November 2015): research articles, in page order.

%%% NOTE(review): second author spelled with accents (Dur\'an-D\'{\i}az);
%%% the unaccented form looks like an artifact of ASCII-only publisher
%%% metadata --- confirm against the DOI landing page.
@Article{Sarmiento:2015:CFB,
  author          = "A. Sarmiento and I. Dur{\'a}n-D{\'\i}az and A. Cichocki and S. Cruces",
  title           = "A Contrast Function Based on Generalized Divergences for Solving the Permutation Problem in Convolved Speech Mixtures",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1713--1726",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2447281",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhao:2015:CSI,
  author          = "Xiaojia Zhao and Yuxuan Wang and Deliang Wang",
  title           = "Cochannel Speaker Identification in Anechoic and Reverberant Conditions",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1727--1736",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2447284",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Chen:2015:APS,
  author          = "Liang-Yu Chen and J.-S. R. Jang",
  title           = "Automatic Pronunciation Scoring with Score Combination by Learning to Rank and Class-Normalized {DP}-Based Quantization",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1737--1749",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2449089",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Tang:2015:JSC,
  author          = "Duyu Tang and Bing Qin and Furu Wei and Li Dong and Ting Liu and Ming Zhou",
  title           = "A Joint Segmentation and Classification Framework for Sentence Level Sentiment Classification",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1750--1761",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2449071",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Hoffmann:2015:TSA,
  author          = "F.-M. Hoffmann and F. M. Fazi",
  title           = "Theoretical Study of Acoustic Circular Arrays With Tangential Pressure Gradient Sensors",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1762--1774",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2449083",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% NOTE(review): first author's surname spelled with a grave accent
%%% (Souvira\`a-Labastie); the citation key keeps its ASCII form ---
%%% confirm the spelling against the DOI landing page.
@Article{Souviraa-Labastie:2015:MCA,
  author          = "N. Souvira{\`a}-Labastie and A. Olivero and E. Vincent and F. Bimbot",
  title           = "Multi-Channel Audio Source Separation Using Multiple Deformed References",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1775--1787",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2450494",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Baby:2015:CDE,
  author          = "D. Baby and T. Virtanen and J. F. Gemmeke and H. {Van hamme}",
  title           = "Coupled Dictionaries for Exemplar-Based Speech Enhancement and Automatic Speech Recognition",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1788--1799",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2450491",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% NOTE(review): title restored to ``Student $t$ Modeling''; the
%%% math-mode letter appears to have been dropped from the publisher
%%% metadata --- confirm against the DOI landing page.  The eponyms
%%% Student and Teager are brace-protected against style downcasing.
@Article{Islam:2015:SEB,
  author          = "M. T. Islam and C. Shahnaz and Wei-Ping Zhu and M. O. Ahmad",
  title           = "Speech Enhancement Based on {Student} {$t$} Modeling of {Teager} Energy Operated Perceptual Wavelet Packet Coefficients and a Custom Thresholding Function",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1800--1811",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2443983",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Do:2015:DAS,
  author          = "Quynh Thi Ngoc Do and S. Bethard and M.-F. Moens",
  title           = "Domain Adaptation in Semantic Role Labeling Using a Neural Language Model and Linguistic Resources",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1812--1823",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2449072",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Aragonda:2015:DNS,
  author          = "H. Aragonda and C. S. Seelamantula",
  title           = "Demodulation of Narrowband Speech Spectrograms Using the {Riesz} Transform",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1824--1834",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2449088",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Tran:2015:NUE,
  author          = "D. T. Tran and E. Vincent and D. Jouvet",
  title           = "Nonparametric Uncertainty Estimation and Propagation for Noise Robust {ASR}",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1835--1846",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2450497",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Tu:2015:EDF,
  author          = "Mei Tu and Yu Zhou and Chengqing Zong",
  title           = "Exploring Diverse Features for Statistical Machine Translation Model Pruning",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1847--1857",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2456413",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Okopal:2015:SAS,
  author          = "G. Okopal and S. Wisdom and L. Atlas",
  title           = "Speech Analysis With the Strong Uncorrelating Transform",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1858--1868",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2456426",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% NOTE(review): the first author's family name is presumably the
%%% compound ``Sim\'on G\'alvez''; it is braced so that BibTeX does not
%%% treat ``Simon'' as a given name.  The citation key is unchanged ---
%%% confirm the name against the DOI landing page.
@Article{Galvez:2015:TDO,
  author          = "M. F. {Sim{\'o}n G{\'a}lvez} and S. J. Elliott and J. Cheer",
  title           = "Time Domain Optimization of Filters Used in a Loudspeaker Array for Personal Audio",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1869--1878",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2456428",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Bokaei:2015:LDS,
  author          = "M. H. Bokaei and H. Sameti and Yang Liu",
  title           = "Linear Discourse Segmentation of Multi-Party Meetings Based on Local and Global Information",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1879--1891",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2456430",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wu:2015:CSE,
  author          = "Chung-Hsien Wu and Han-Ping Shen and Chun-Shan Hsu",
  title           = "Code-Switching Event Detection by Using a Latent Language Space Model and the Delta-{Bayesian} Information Criterion",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1892--1903",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2456417",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Chen:2015:OMS,
  author          = "Zhangli Chen and V. Hohmann",
  title           = "Online Monaural Speech Enhancement Based on Periodicity Analysis and A Priori {SNR} Estimation",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1904--1916",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2456423",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Sarreshtedari:2015:WMD,
  author          = "S. Sarreshtedari and M. A. Akhaee and A. Abbasfar",
  title           = "A Watermarking Method for Digital Speech Self-Recovery",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1917--1925",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2456431",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% NOTE(review): second author spelled with an umlaut (Anem\"uller);
%%% the unaccented form looks like an artifact of ASCII-only publisher
%%% metadata --- confirm against the DOI landing page.
@Article{Moritz:2015:AIA,
  author          = "N. Moritz and J. Anem{\"u}ller and B. Kollmeier",
  title           = "An Auditory Inspired Amplitude Modulation Filter Bank for Robust Feature Extraction in Automatic Speech Recognition",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1926--1937",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2456420",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Miao:2015:SAT,
  author          = "Yajie Miao and Hao Zhang and F. Metze",
  title           = "Speaker Adaptive Training of Deep Neural Network Acoustic Models Using {$I$}-Vectors",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1938--1949",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2457612",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Morfi:2015:SAS,
  author          = "V. Morfi and G. Degottex and A. Mouchtaris",
  title           = "Speech Analysis and Synthesis with a Computationally Efficient Adaptive Harmonic Model",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1950--1962",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2458580",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Dennis:2015:GHT,
  author          = "J. Dennis and H. D. Tran and Haizhou Li",
  title           = "Generalized {Hough} Transform for Speech Pattern Classification",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1963--1972",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2459599",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Deng:2015:SHM,
  author          = "Feng Deng and Changchun Bao and W. B. Kleijn",
  title           = "Sparse Hidden {Markov} Models for Speech Enhancement in Non-Stationary Noise Environments",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1973--1987",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2458585",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ranjan:2015:NLH,
  author          = "R. Ranjan and Woon-Seng Gan",
  title           = "Natural Listening over Headphones in Augmented Reality Using Adaptive Filtering Techniques",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "23",
  number          = "11",
  pages           = "1988--2002",
  month           = nov,
  year            = "2015",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2015.2460459",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Mon Oct 5 06:29:46 MDT 2015",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Chen:2015:DGA, author = "L.-H. Chen and T. Raitio and C. Valentini-Botinhao and Z.-H. Ling and J.
Yamagishi", title = "A Deep Generative Architecture for Postfiltering in Statistical Parametric Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "23", number = "11", pages = "2003--2014", month = nov, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2461448", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:46 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shin:2015:PSE, author = "Ho Seon Shin and T. Fingscheidt and Hong-Goo Kang", title = "A Priori {SNR} Estimation Using Air- and Bone-Conduction Microphones", journal = j-IEEE-ACM-TASLP, volume = "23", number = "11", pages = "2015--2025", month = nov, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2446202", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:46 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2015:PFR, author = "Ji Wu and Miao Li and Chin-Hui Lee", title = "A Probabilistic Framework for Representing Dialog Systems and Entropy-Based Dialog Management Through Dynamic Stochastic State Evolution", journal = j-IEEE-ACM-TASLP, volume = "23", number = "11", pages = "2026--2035", month = nov, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2462712", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:46 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM 
Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cumani:2015:FSF, author = "S. Cumani", title = "Fast Scoring of Full Posterior {PLDA} Models", journal = j-IEEE-ACM-TASLP, volume = "23", number = "11", pages = "2036--2045", month = nov, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2464678", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:46 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tourbabin:2015:DAE, author = "V. Tourbabin and B. Rafaely", title = "Direction of Arrival Estimation Using Microphone Array Processing for Moving Humanoid Robots", journal = j-IEEE-ACM-TASLP, volume = "23", number = "11", pages = "2046--2058", month = nov, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2464671", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:46 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chu:2015:NLP, author = "Y. J. Chu and S. C. 
Chan", title = "A New Local Polynomial Modeling-Based Variable Forgetting Factor {RLS} Algorithm and Its Acoustic Applications", journal = j-IEEE-ACM-TASLP, volume = "23", number = "11", pages = "2059--2069", month = nov, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2464692", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:46 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{de-la-Calle-Silos:2015:MFP, author = "F. de-la-Calle-Silos and F. J. Valverde-Albacete and A. Gallardo-Antol{\'\i}n and C. Pel{\'a}ez-Moreno", title = "Morphologically Filtered Power-Normalized Cochleograms as Robust, Biologically Inspired Features for {ASR}", journal = j-IEEE-ACM-TASLP, volume = "23", number = "11", pages = "2070--2080", month = nov, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2464691", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:46 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hirao:2015:SDT, author = "T. Hirao and M. Nishino and Y. Yoshida and J. Suzuki and N. Yasuda and M. 
Nagata", title = "Summarizing a Document by Trimming the Discourse Tree", journal = j-IEEE-ACM-TASLP, volume = "23", number = "11", pages = "2081--2092", month = nov, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2465150", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:46 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pan:2015:TAD, author = "Chao Pan and Jingdong Chen and J. Benesty", title = "Theoretical Analysis of Differential Microphone Array Beamforming and an Improved Solution", journal = j-IEEE-ACM-TASLP, volume = "23", number = "11", pages = "2093--2105", month = nov, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2469142", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Mon Oct 5 06:29:46 MDT 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Che:2015:SCA, author = "Wanxiang Che and Yanyan Zhao and Honglei Guo and Zhong Su and Ting Liu", title = "Sentence Compression for Aspect-Based Sentiment Analysis", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2111--2124", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2443982", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sheaffer:2015:BRF, author = "J. Sheaffer and M. van Walstijn and B. Rafaely and K. Kowalczyk", title = "Binaural Reproduction of Finite Difference Simulations Using Spherical Array Processing", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2125--2135", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2468066", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Huang:2015:JOM, author = "Po-Sen Huang and Minje Kim and M. Hasegawa-Johnson and P. Smaragdis", title = "Joint Optimization of Masks and Deep Recurrent Neural Networks for Monaural Source Separation", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2136--2147", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2468583", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Heidel:2015:FCF, author = "A. 
Heidel and Hsiang-Hung Lu and Lin-Shan Lee", title = "Finding Complex Features for Guest Language Fragment Recovery in Resource-Limited Code-Mixed Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2148--2161", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2469634", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Marquardt:2015:ICP, author = "D. Marquardt and V. Hohmann and S. Doclo", title = "Interaural Coherence Preservation in Multi-Channel {Wiener} Filtering-Based Noise Reduction for Binaural Hearing Aids", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2162--2176", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2471096", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yu:2015:CMB, author = "Kai Yu and Kai Sun and Lu Chen and Su Zhu", title = "Constrained {Markov} {Bayesian} Polynomial for Efficient Dialogue State Tracking", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2177--2188", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2470597", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", 
acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anderson:2015:SRF, author = "C. A. Anderson and P. D. Teal and M. A. Poletti", title = "Spatially Robust Far-field Beamforming Using the {von Mises(--Fisher)} Distribution", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2189--2197", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2473684", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schroder:2015:STG, author = "J. Schr{\"o}der and S. Goetze and J. Anem{\"u}ller", title = "Spectro-Temporal {Gabor} Filterbank Features for Acoustic Event Detection", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2198--2208", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2467964", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Heo:2015:CBS, author = "Inseok Heo and W. A. 
Sethares", title = "Classification Based on Speech Rhythm via a Temporal Alignment of Spoken Sentences", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2209--2216", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2475155", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Samarasinghe:2015:EPR, author = "P. Samarasinghe and T. Abhayapala and M. Poletti and T. Betlehem", title = "An Efficient Parameterization of the Room Transfer Function", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2217--2227", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2475173", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xiang:2015:SSB, author = "Yong Xiang and I. 
Natgunanathan and Yue Rong and Song Guo", title = "Spread Spectrum-Based High Embedding Capacity Watermarking Method for Audio Signals", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2228--2237", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2476755", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yoo:2015:FBR, author = "In-Chul Yoo and Hyeontaek Lim and Dongsuk Yook", title = "Formant-Based Robust Voice Activity Detection", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2238--2245", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2476762", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hueber:2015:SAA, author = "T. Hueber and L. Girin and X. Alameda-Pineda and G. 
Bailly", title = "Speaker-Adaptive Acoustic-Articulatory Inversion Using Cascaded {Gaussian} Mixture Regression", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2246--2259", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2464702", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bai:2015:LRS, author = "Hequn Bai and G. Richard and L. Daudet", title = "Late Reverberation Synthesis: From Radiance Transfer to Feedback Delay Networks", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2260--2271", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2478116", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bayram:2015:MAD, author = "I. 
Bayram", title = "A Multichannel Audio Denoising Formulation Based on Spectral Sparsity", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2272--2285", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479042", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Delgado:2015:FSC, author = "H. Delgado and X. Anguera and C. Fredouille and J. Serrano", title = "Fast Single- and Cross-Show Speaker Diarization Using Binary Key Speaker Modeling", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2286--2297", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479043", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Percybrooks:2015:NHB, author = "W. S. Percybrooks and E. 
Moore", title = "A New {HMM}-Based Voice Conversion Methodology Evaluated on Monolingual and Cross-Lingual Conversion Tasks", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2298--2310", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479040", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Graja:2015:SFK, author = "M. Graja and M. Jaoua and L. H. Belguith", title = "Statistical Framework with Knowledge Base Integration for Robust Speech Understanding of the {Tunisian} Dialect", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2311--2321", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2464687", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Strasser:2015:AFC, author = "F. Strasser and H. 
Puder", title = "Adaptive Feedback Cancellation for Realistic Hearing Aid Applications", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2322--2333", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479038", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yeung:2015:SSM, author = "Yu Ting Yeung and Tan Lee and Cheung-Chi Leung", title = "Supervised Single-Microphone Multi-Talker Speech Separation with Conditional Random Fields", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2334--2342", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479039", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jin:2015:TDM, author = "Wenyu Jin and W. B. 
Kleijn", title = "Theory and Design of Multizone Soundfield Reproduction Using Sparse Methods", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2343--2355", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479037", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhong:2015:TFM, author = "Xionghu Zhong and J. R. Hopgood", title = "A {Time--Frequency} Masking Based Random Finite Set Particle Filtering Method for Multiple Acoustic Source Detection and Tracking", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2356--2370", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479041", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Vijayan:2015:APS, author = "K. Vijayan and K. S. R. 
Murty", title = "Analysis of Phase Spectrum of Speech Signals Using Allpass Modeling", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2371--2383", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479045", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Marquardt:2015:TAL, author = "D. Marquardt and E. Hadad and S. Gannot and S. Doclo", title = "Theoretical Analysis of Linearly Constrained Multi-Channel {Wiener} Filtering Algorithms for Combined Noise Reduction and Binaural Cue Preservation in Binaural Hearing Aids", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2384--2397", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2479940", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zohrer:2015:RLS, author = "M. Z{\"o}hrer and R. Peharz and F. 
Pernkopf", title = "Representation Learning for Single-Channel Source Separation and Bandwidth Extension", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2398--2409", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2470560", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fang:2015:ELM, author = "Hao Fang and M. Ostendorf and P. Baumann and J. Pierrehumbert", title = "Exponential Language Modeling Using Morphological Features and Multi-Task Learning", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2410--2421", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2482118", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Carlin:2015:FSA, author = "M. A. Carlin and M. 
Elhilali", title = "A Framework for Speech Activity Detection Using Adaptive Auditory Receptive Fields", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2422--2433", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2481179", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Saito:2015:CBS, author = "S. Saito and K. Oishi and T. Furukawa", title = "Convolutive Blind Source Separation Using an Iterative Least-Squares Algorithm for Non-Orthogonal Approximate Joint Diagonalization", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2434--2448", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2485663", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hadad:2015:TAB, author = "E. Hadad and D. Marquardt and S. Doclo and S. 
Gannot", title = "Theoretical Analysis of Binaural Transfer Function {MVDR} Beamformers with Interference Cue Preservation Constraints", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2449--2464", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2486381", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2015:PEU, author = "Guang Yang and R. F. Lyon and E. M. Drakakis", title = "Psychophysical Evaluation of An Ultra-Low Power, Analog Biomimetic Cochlear Implant Processor Filterbank Architecture With Across Channels {AGC}", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2465--2473", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2488290", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2015:LR, author = "Anonymous", title = "List of Reviewers", journal = j-IEEE-ACM-TASLP, volume = "23", number = "12", pages = "2474--2476", month = dec, year = "2015", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2488318", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Nov 17 07:34:26 MST 2015", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language 
Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:TCa, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "1--2", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2510059", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:TCb, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "3--4", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2510138", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Brognaux:2016:HBS, author = "S. Brognaux and T. 
Drugman", title = "{HMM}-Based Speech Segmentation: Improvements of Fully Automatic Approaches", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "5--15", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2456421", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tahon:2016:TSS, author = "M. Tahon and L. Devillers", title = "Towards a Small Set of Robust Acoustic Features for Emotion Recognition: Challenges", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "16--28", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2487051", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Behravan:2016:VMS, author = "H. Behravan and V. Hautamaki and S. M. Siniscalchi and T. 
Kinnunen and Chin-Hui Lee", title = "$i$-Vector Modeling of Speech Attributes for Automatic Foreign Accent Recognition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "29--41", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2489558", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Saeidi:2016:FEU, author = "R. Saeidi and P. Alku and T. Backstrom", title = "Feature Extraction Using Power-Law Adjusted Linear Prediction With Application to Speaker Recognition Under Severe Vocal Effort Mismatch", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "42--53", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2493366", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ardekani:2016:SIP, author = "I. T. Ardekani and J. P. Kaipio and A. Nasiri and H. Sharifzadeh and W. H. 
Abdulla", title = "A Statistical Inverse Problem Approach to Online Secondary Path Modeling in Active Noise Control", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "54--64", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2495249", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Stafylakis:2016:SCF, author = "T. Stafylakis and P. Kenny and M. J. Alam and M. Kockmann", title = "Speaker and Channel Factors in Text-Dependent Speaker Recognition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "65--78", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2497248", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{He:2016:UPB, author = "Yanzhang He and P. Baumann and Hao Fang and B. Hutchinson and A. Jaech and M. Ostendorf and E. Fosler-Lussier and J. 
Pierrehumbert", title = "Using Pronunciation-Based Morphological Subword Units to Improve {OOV} Handling in Keyword Search", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "79--92", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2496222", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sun:2016:UNE, author = "Meng Sun and Xiongwei Zhang and H. {Van Hamme} and T. F. Zheng", title = "Unseen Noise Estimation Using Separable Deep Auto Encoder for Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "93--104", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2498101", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ferrer:2016:SSB, author = "L. Ferrer and Yun Lei and M. McLaren and N. 
Scheffer", title = "Study of Senone-Based Deep Neural Network Approaches for Spoken Language Recognition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "105--116", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2496226", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Adalbjornsson:2016:SLH, author = "S. I. Adalbjornsson and T. Kronvall and S. Burgess and K. Astrom and A. Jakobsson", title = "Sparse Localization of Harmonic Audio Sources", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "117--129", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2497798", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mak:2016:MPN, author = "Man-Wai Mak and Xiaomin Pang and Jen-Tzung Chien", title = "Mixture of {PLDA} for Noise Robust {$I$}-Vector Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "130--142", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2499038", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", 
journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anderson:2016:SCR, author = "C. A. Anderson and P. D. Teal and M. A. Poletti", title = "Spatial Correlation of Radial {Gaussian} and Uniform Spherical Volume Near-Field Source Distributions", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "143--150", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2500028", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Torres:2016:NEM, author = "H. Torres and J. Gurlekian", title = "Novel Estimation Method for the Superpositional Intonation Model", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "151--160", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2500728", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bilbao:2016:FVT, author = "S. Bilbao and B. Hamilton and J. Botts and L. 
Savioja", title = "Finite Volume Time Domain Room Acoustics Simulation under General Impedance Boundary Conditions", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "161--173", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2500018", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Torbati:2016:DHD, author = "A. H. Harati Nejad Torbati and J. Picone", title = "A Doubly Hierarchical {Dirichlet} Process Hidden {Markov} Model with a Non-Ergodic Structure", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "174--184", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2500732", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chien:2016:BFL, author = "Jen-Tzung Chien and Po-Kai Yang", title = "{Bayesian} Factorization and Learning for Monaural Source Separation", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "185--195", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2502141", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", 
journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Alon:2016:BOA, author = "D. L. Alon and B. Rafaely", title = "Beamforming with Optimal Aliasing Cancellation in Spherical Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "196--210", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2502059", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IATa, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Edics", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "211--212", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2519646", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IAa, author = "Anonymous", title = "Information for authors", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "213--214", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2519647", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, 
Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:SISa, author = "Anonymous", title = "Special issue on sound scene and event analysis", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "215", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2519218", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:FCa, author = "Anonymous", title = "[{Front} cover]", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "C1", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2510838", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IATb, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "C2", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2519644", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and 
Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:ISPa, author = "Anonymous", title = "{IEEE Signal Processing Society} Information", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "C3", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2519645", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:BPa, author = "Anonymous", title = "[{Blank} page]", journal = j-IEEE-ACM-TASLP, volume = "24", number = "1", pages = "C4", month = jan, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2519643", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:TCc, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "211--212", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2517760", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:TCd, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "213--214", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2517798", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rasumow:2016:RAS, author = "E. Rasumow and M. Hansen and S. van de Par and D. Puschel and V. Mellert and S. Doclo and M. Blau", title = "Regularization Approaches for Synthesizing {HRTF} Directivity Patterns", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "215--225", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2504874", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pan:2016:DDP, author = "Chao Pan and J. 
Benesty and Jingdong Chen", title = "Design of Directivity Patterns with a Unique Null of Maximum Multiplicity", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "226--235", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2504866", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hung:2016:RSR, author = "Jeih-Weih Hung and Hsin-Ju Hsieh and Berlin Chen", title = "Robust Speech Recognition via Enhancing the Complex-Valued Acoustic Spectrum in Modulation Domain", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "236--251", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2504781", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2016:BCI, author = "Xiao-Lei Zhang and DeLiang Wang", title = "Boosting Contextual Information for Deep Neural Network Based Voice Activity Detection", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "252--264", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2505415", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, 
and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Turan:2016:SFE, author = "M. A. Tugtekin Turan and E. Erzin", title = "Source and Filter Estimation for Throat-Microphone Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "265--275", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2499040", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mohammadiha:2016:SDU, author = "N. Mohammadiha and S. Doclo", title = "Speech Dereverberation Using Non-Negative Convolutive Transfer Function and Spectro-Temporal Modeling", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "276--289", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2501724", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sharma:2016:TSS, author = "A. Sharma and S. 
Kaul", title = "Two-Stage Supervised Learning-Based Method to Detect Screams and Cries in Urban Environments", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "290--299", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2506264", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2016:DFF, author = "Xiaoguang Wu and Huawei Chen", title = "Directivity Factors of the First-Order Steerable Differential Array With Microphone Mismatches: Deterministic and Worst-Case Analysis", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "300--315", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2506269", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Koutrouvelis:2016:FMH, author = "A. I. Koutrouvelis and G. P. Kafentzis and N. D. Gaubitch and R. 
Heusdens", title = "A Fast Method for High-Resolution Voiced\slash Unvoiced Detection and Glottal Closure\slash Opening Instant Estimation of Speech", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "316--328", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2506263", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nakamura:2016:RTA, author = "T. Nakamura and E. Nakamura and S. Sagayama", title = "Real-Time Audio-to-Score Alignment of Music Performances Containing Errors and Arbitrary Repeats and Skips", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "329--339", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2507862", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bahne:2016:OSL, author = "A. Bahne and A. 
Ahlen", title = "Optimizing the Similarity of Loudspeaker-Room Responses in Multiple Listening Positions", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "340--353", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2496156", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kates:2016:HAA, author = "J. M. Kates and K. H. Arehart", title = "The {Hearing-Aid Audio Quality Index (HAAQI)}", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "354--365", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2507858", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schepker:2016:SPA, author = "H. Schepker and S. 
Doclo", title = "A Semidefinite Programming Approach to Min-max Estimation of the Common Part of Acoustic Feedback Paths in Hearing Aids", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "366--377", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2507940", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lee:2016:PLC, author = "Bong-Ki Lee and Joon-Hyuk Chang", title = "Packet Loss Concealment Based on Deep Neural Networks for Digital Speech Transmission", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "378--387", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2509780", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bentivogli:2016:EAM, author = "L. Bentivogli and N. Bertoldi and M. Cettolo and M. Federico and M. Negri and M. 
Turchi", title = "On the Evaluation of Adaptive Machine Translation for Human Post-Editing", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "388--399", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2509241", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IATc, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Edics", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "400--401", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2519640", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IAb, author = "Anonymous", title = "Information for authors", journal = j-IEEE-ACM-TASLP, volume = "24", number = "2", pages = "402--403", month = "????", year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2519641", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Feb 9 07:50:48 MST 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
%%% Volume 24, number 2 back matter and covers.  The journal is monthly,
%%% so the month of number 2 is recorded as feb rather than left unknown.

@Article{Anonymous:2016:SISb,
  author =       "Anonymous",
  title =        "Special issue on sound scene and event analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "404",
  month =        feb,
  year =         "2016",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2016.2519219",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:FCb,
  author =       "Anonymous",
  title =        "[{Front} cover]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "C1",
  month =        feb,
  year =         "2016",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2016.2519650",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:IATd,
  author =       "Anonymous",
  title =        "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "C2",
  month =        feb,
  year =         "2016",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2016.2519638",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}
%%% Volume 24, number 2 covers.  The journal is monthly, so the month
%%% of number 2 is recorded as feb rather than left unknown.

@Article{Anonymous:2016:ISPb,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society} Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "C3",
  month =        feb,
  year =         "2016",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2016.2519639",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:BPb,
  author =       "Anonymous",
  title =        "[{Blank} page]",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "2",
  pages =        "C4",
  month =        feb,
  year =         "2016",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2016.2519642",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Tue Feb 9 07:50:48 MST 2016",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 24, number 3 begins here.

@Article{Anonymous:2016:TCe,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "24",
  number =       "3",
  pages =        "405--406",
  month =        mar,
  year =         "2016",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2016.2534598",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Wed Jun 8 09:17:36 MDT 2016",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:TCf, author = "Anonymous", title = "Table of Contents", journal 
= j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "407--408", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2534623", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sonnleitner:2016:RQB, author = "Reinhard Sonnleitner and Gerhard Widmer", title = "Robust Quad-Based Audio Fingerprinting", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "409--421", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2509248", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Dong:2016:AMC, author = "Li Dong and Furu Wei and Ke Xu and Shixia Liu and Ming Zhou", title = "Adaptive Multi-Compositionality for Recursive Neural Network Models", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "422--431", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2509257", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2016:UCL, author = "Zheng Lin and 
Xiaolong Jin and Xueke Xu and Yuanzhuo Wang and Xueqi Cheng and Weiping Wang and Dan Meng", title = "An Unsupervised Cross-Lingual Topic Model Framework for Sentiment Classification", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "432--444", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2512041", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nagathil:2016:SCR, author = "Anil Nagathil and Claus Weihs and Rainer Martin", title = "Spectral Complexity Reduction of Music Signals for Mitigating Effects of Cochlear Hearing Loss", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "445--458", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2511623", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tan:2016:CAT, author = "Tian Tan and Yanmin Qian and Kai Yu", title = "Cluster Adaptive Training for Deep Neural Network Based Acoustic Model", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "459--468", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2511922", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = 
"IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Leijon:2016:BAP, author = "Arne Leijon and Gustav Eje Henter and Martin Dahlquist", title = "{Bayesian} Analysis of Phoneme Confusion Matrices", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "469--482", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2512039", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Williamson:2016:CRM, author = "Donald S. Williamson and Yuxuan Wang and DeLiang Wang", title = "Complex Ratio Masking for Monaural Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "483--492", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2512042", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Traa:2016:RSL, author = "Johannes Traa and David Wingate and Noah D. 
Stein and Paris Smaragdis", title = "Robust Source Localization and Enhancement With a Probabilistic Steered Response Power Model", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "493--503", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2512499", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shepstone:2016:TVM, author = "Sven Ewan Shepstone and Kong Aik Lee and Haizhou Li and Zheng-Hua Tan and S{\o}ren Holdt Jensen", title = "Total Variability Modeling Using Source-Specific Priors", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "504--517", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2515506", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schneider:2016:MAE, author = "Martin Schneider and Walter Kellermann", title = "Multichannel Acoustic Echo Cancellation in the Wave Domain With Increased Robustness to Nonuniqueness", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "518--529", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2515502", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = 
"IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{OHanlon:2016:NNG, author = "Ken O'Hanlon and Hidehisa Nagano and Nicolas Keriven and Mark D. Plumbley", title = "Non-Negative Group Sparsity with Subspace Note Modelling for Polyphonic Transcription", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "530--542", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2515514", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hadad:2016:BLB, author = "Elior Hadad and Simon Doclo and Sharon Gannot", title = "The Binaural {LCMV} Beamformer and its Performance Analysis", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "543--558", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2514496", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Grijalva:2016:MLA, author = "Felipe Grijalva and Luiz Martini and Dinei Florencio and Siome Goldenstein", title = "A Manifold Learning Approach for Personalizing {HRTFs} from Anthropometric Features", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "559--570", month = mar, year = "2016", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2016.2517565", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2016:CMB, author = "Lin Wang and Simon Doclo", title = "Correlation Maximization-Based Sampling Rate Offset Estimation for Distributed Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "571--582", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2517326", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Radmanesh:2016:LLO, author = "Nasim Radmanesh and Ian S. Burnett and Bhaskar D. 
Rao", title = "A Lasso-{LS} Optimization with a Frequency Variable Dictionary in a Multizone Sound System", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "583--593", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2518801", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2016:ABE, author = "Xin Liu and Changchun Bao", title = "Audio Bandwidth Extension Based on Ensemble Echo State Networks with Temporal Evolution", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "594--607", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2519146", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:ECIa, author = "Anonymous", title = "{EDICS} Categories for {IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "608--609", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2545440", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IAc, author = "Anonymous", title = "Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "610--611", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2545458", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:SISc, author = "Anonymous", title = "Special issue on sound scene and event analysis", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "612", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2545198", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IICa, author = "Anonymous", title = "Introducing {IEEE Collabratec}", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "613", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2545158", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:FCc, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "C1", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2540778", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IATe, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "C2", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2545082", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IATf, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}", journal = j-IEEE-ACM-TASLP, volume = "24", number = "3", pages = "C3", month = mar, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2545117", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:36 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:TCg, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "608--609", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2541258", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:TCh, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "610--611", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2541259", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2016:JAI, author = "Peifeng Li and Guodong Zhou", title = "Joint Argument Inference in {Chinese} Event Extraction with Argument Consistency and Event Relevance", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "612--622", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2497148", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2016:PAF, author = "Jianming Liu and Steven L. Grant", title = "Proportionate Adaptive Filtering for Block-Sparse System Identification", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "623--630", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2499602", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jensen:2016:NRO, author = "Jesper Rindom Jensen and Jacob Benesty and Mads Gr{\ae}sb{\o}ll Christensen", title = "Noise Reduction with Optimal Variable Span Linear Filters", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "631--644", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2505416", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Norholm:2016:ENS, author = "Sidsel Marie N{\o}rholm and Jesper Rindom Jensen and Mads Gr{\ae}sb{\o}ll Christensen", title = "Enhancement and Noise Statistics Estimation for Non-Stationary Voiced Speech", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "645--658", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2514492", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mehta:2016:RBV, author = "Daryush D. Mehta and Jarrad H. {Van Stan} and Robert E. Hillman", title = "Relationships Between Vocal Function Measures Derived from an Acoustic Microphone and a Subglottal Neck-Surface Accelerometer", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "659--668", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2516647", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kamper:2016:UWS, author = "Herman Kamper and Aren Jansen and Sharon Goldwater", title = "Unsupervised Word Segmentation and Lexicon Discovery Using Acoustic Word Embeddings", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "669--679", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2517567", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kodrasi:2016:JDN, author = "Ina Kodrasi and Simon Doclo", title = "Joint Dereverberation and Noise Reduction Based on Acoustic Multi-Channel Equalization", journal = j-IEEE-ACM-TASLP, 
volume = "24", number = "4", pages = "680--693", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2518804", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Palangi:2016:DSE, author = "Hamid Palangi and Li Deng and Yelong Shen and Jianfeng Gao and Xiaodong He and Jianshu Chen and Xinying Song and Rabab Ward", title = "Deep Sentence Embedding Using Long Short-Term Memory Networks: Analysis and Application to Information Retrieval", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "694--707", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2520371", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jeffet:2016:TPE, author = "Michael Jeffet and Noam R. 
Shabtai and Boaz Rafaely", title = "Theory and Perceptual Evaluation of the Binaural Reproduction and Beamforming Tradeoff in the Generalized Spherical Array Beamformer", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "708--718", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2522649", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Parada:2016:SCN, author = "Pablo Peso Parada and Dushyant Sharma and Jose Lainez and Daniel Barreda and Toon van Waterschoot and Patrick A. Naylor", title = "A Single-Channel Non-Intrusive {C50} Estimator Correlated With Speech Recognition Performance", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "719--732", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2521486", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Su:2016:ETT, author = "Ming-Hsiang Su and Chung-Hsien Wu and Yu-Ting Zheng", title = "Exploiting Turn-Taking Temporal Evolution for Personality Trait Perception in Dyadic Conversations", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "733--744", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2531286", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Abdul-Rauf:2016:EUI, author = "Sadaf Abdul-Rauf and Holger Schwenk and Patrik Lambert and Mohammad Nawaz", title = "Empirical Use of Information Retrieval to Build Synthetic Data for {SMT} Domain Adaptation", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "745--754", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2517318", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Takamichi:2016:PMM, author = "Shinnosuke Takamichi and Tomoki Toda and Alan W. Black and Graham Neubig and Sakriani Sakti and Satoshi Nakamura", title = "Postfilters to Modify the Modulation Spectrum for Statistical Parametric Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "755--767", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2522655", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2016:AST, author = "Zhizheng Wu and Phillip L. 
{De Leon} and Cenk Demiroglu and Ali Khodabakhsh and Simon King and Zhen-Hua Ling and Daisuke Saito and Bryan Stewart and Tomoki Toda and Mirjam Wester and Junichi Yamagishi", title = "Anti-Spoofing for Text-Independent Speaker Verification: an Initial Database, Comparison of Countermeasures, and Human Performance", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "768--783", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2526653", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Andersen:2016:ATF, author = "Kristian Timm Andersen and Marc Moonen", title = "Adaptive Time-Frequency Analysis for Noise Reduction in an Audio Filter Bank With Low Delay", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "784--795", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2526779", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2016:JTF, author = "Zhong-Qiu Wang and DeLiang Wang", title = "A Joint Training Framework for Robust Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "796--806", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2528171", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 
2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Phan:2016:LRN, author = "Huy Phan and Lars Hertel and Marco Maass and Radoslaw Mazur and Alfred Mertins", title = "Learning Representations for Nonspeech Audio Events Through Their Similarities to Speech Patterns", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "807--822", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2530401", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:ECIb, author = "Anonymous", title = "{EDICS} Categories for {IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "823--824", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2542598", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IAd, author = "Anonymous", title = "Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "825--826", month = apr, year = "2016", CODEN = "????", DOI =
"https://doi.org/10.1109/TASLP.2016.2542618", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:SISd, author = "Anonymous", title = "Special Issue on Sound Scene and Event Analysis", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "827", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2542599", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IICb, author = "Anonymous", title = "Introducing {IEEE Collabratec}", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "828", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2545138", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:FCd, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "C1", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2542020", ISSN = "2329-9290", ISSN-L =
"2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IATg, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}", journal = j-IEEE-ACM-TASLP, volume = "24", number = "4", pages = "C2", month = apr, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2541023", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:TCi, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "829--830", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2556158", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:TCj, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "831--832", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2556178", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", 
bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tsai:2016:REM, author = "T. J. Tsai and Andreas Stolcke", title = "Robust and Efficient Multiple Alignment of Unsynchronized Meeting Recordings", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "833--845", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2526787", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Receveur:2016:TAS, author = "Simon Receveur and Robin Wei{\ss} and Tim Fingscheidt", title = "Turbo Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "846--862", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2520364", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Marxer:2016:UIO, author = "Ricard Marxer and Hendrik Purwins", title = "Unsupervised Incremental Online Learning and Prediction of Musical Audio Signals", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "863--874", month = may, year = "2016", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2016.2530409", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Adeli:2016:FBI, author = "Mohammad Adeli and Jean Rouat and Sean Wood and St{\'e}phane Molotchnikoff and Eric Plourde", title = "A Flexible Bio-Inspired Hierarchical Model for Analyzing Musical Timbre", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "875--889", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2530405", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2016:FFE, author = "Geliang Zhang and Simon Godsill", title = "Fundamental Frequency Estimation in Speech Signals With Variable Rate Particle Filters", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "890--900", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2531285", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kroher:2016:ATF, author = "Nadine Kroher and Emilia G{\'o}mez", title = "Automatic 
Transcription of Flamenco Singing From Polyphonic Music Recordings", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "901--913", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2531284", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Winter:2016:AMD, author = "Fiete Winter and Jens Ahrens and Sascha Spors", title = "On Analytic Methods for {$ 2.5$-D} Local Sound Field Synthesis Using Circular Distributions of Secondary Sources", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "914--926", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2531902", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sigtia:2016:EEN, author = "Siddharth Sigtia and Emmanouil Benetos and Simon Dixon", title = "An End-to-End Neural Network for Polyphonic Piano Music Transcription", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "927--939", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2533858", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", 
journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Krawczyk-Becker:2016:FFI, author = "Martin Krawczyk-Becker and Timo Gerkmann", title = "Fundamental Frequency Informed Speech Enhancement in a Flexible Statistical Framework", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "940--951", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2533867", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Szurley:2016:BNC, author = "Joseph Szurley and Alexander Bertrand and Bas {Van Dijk} and Marc Moonen", title = "Binaural Noise Cue Preservation in a Binaural Noise Reduction System With a Remote Microphone Signal", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "952--966", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2535199", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2016:DEL, author = "Xiao-Lei Zhang and DeLiang Wang", title = "A Deep Ensemble Learning Method for Monaural Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "967--977", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2536478", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed 
Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2016:SDA, author = "Haotian Xu and Zhijian Ou", title = "Scalable Discovery of Audio Fingerprint Motifs in Broadcast Streams With Determinantal Point Process Based Motif Clustering", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "978--989", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2537203", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IATh, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} {EDICS}", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "990--991", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2567059", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IATi, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Information for Authors", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "992--993",
month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2567060", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:SISe, author = "Anonymous", title = "Special Issue on Sound Scene and Event Analysis", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "994", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2567140", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:SIBa, author = "Anonymous", title = "Special Issue on Biosignal-based Spoken Communication", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "995", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2567141", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:FCe, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "C1", month = may, year = "2016", CODEN = "????", DOI =
"https://doi.org/10.1109/TASLP.2016.2561218", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IATj, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "C2", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2566998", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IPEa, author = "Anonymous", title = "{IEEE Power Electronics Society} Information", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "C3", month = may, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2567018", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:BPc, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "24", number = "5", pages = "C4", month = may, year = "2016", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2016.2567022", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:37 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:TCk, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "990--991", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2567338", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:TCl, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "992--993", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2567339", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Celikyilmaz:2016:EIW, author = "Asli Celikyilmaz and Ruhi Sarikaya and Minwoo Jeong and Anoop Deoras", title = "An Empirical Investigation of Word Class-Based Features for Natural Language Understanding", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "994--1005", month = jun, year = 
"2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2015.2511925", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nguyen:2016:FAU, author = "Duc Hoang Ha Nguyen and Xiong Xiao and Eng Siong Chng and Haizhou Li", title = "Feature Adaptation Using Linear Spectro-Temporal Transform for Robust Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1006--1019", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2522646", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qian:2016:TPF, author = "Xiaojun Qian and Helen Meng and Frank Soong", title = "A Two-Pass Framework of Mispronunciation Detection and Diagnosis for Computer-Aided Pronunciation Training", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1020--1028", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2526782", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2016:TIP, author = 
"Lijiang Chen and Xia Mao and Hong Yan", title = "Text-Independent Phoneme Segmentation Combining {EGG} and Speech Data", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1029--1037", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2533865", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tavakoli:2016:FSE, author = "Vincent Mohammad Tavakoli and Jesper Rindom Jensen and Mads Gr{\ae}sb{\o}ll Christensen and Jacob Benesty", title = "A Framework for Speech Enhancement With Ad Hoc Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1038--1051", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2537202", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2016:CEP, author = "Yan-You Chen and Chung-Hsien Wu and Yi-Chin Huang and Shih-Lun Lin and Jhing-Fa Wang", title = "Candidate Expansion and Prosody Adjustment for Natural Speech Synthesis Using a Small Corpus", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1052--1065", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2537982", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2016:PAU, author = "Xueliang Zhang and Hui Zhang and Shuai Nie and Guanglai Gao and Wenju Liu", title = "A Pairwise Algorithm Using the Deep Stacking Network for Speech Separation and Pitch Estimation", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1066--1078", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2540805", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2016:IAS, author = "Lin Wang and Tsz-Kin Hon and Joshua D. 
Reiss and Andrea Cavallaro", title = "An Iterative Approach to Source Counting and Localization Using Two Distant Microphones", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1079--1093", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2533859", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{OLeary:2016:MAS, author = "Se{\'a}n O'Leary and Axel R{\"o}bel", title = "A Montage Approach to Sound Texture Synthesis", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1094--1105", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2536481", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ouali:2016:FAF, author = "Chahid Ouali and Pierre Dumouchel and Vishwa Gupta", title = "Fast Audio Fingerprinting System Using {GPU} and a Clustering-Based Technique", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1106--1118", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2541303", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Raposo:2016:UGS, author = "Francisco Raposo and Ricardo Ribeiro and David Martins de Matos", title = "Using Generic Summarization to Improve Music Information Retrieval Tasks", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1119--1128", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2541299", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2016:ISU, author = "Lantian Li and Dong Wang and Chenhao Zhang and Thomas Fang Zheng", title = "Improving Short Utterance Speaker Recognition by Modeling Speech Unit Classes", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1129--1139", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2544660", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Taghia:2016:FDA, author = "Jalal Taghia and Rainer Martin", title = "A Frequency-Domain Adaptive Line Enhancer With Step-Size Control Based on Mutual Information for Harmonic Noise Reduction", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1140--1154", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2545920", ISSN = "2329-9290", ISSN-L = "2329-9290", 
bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IATk, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Edics", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1155--1156", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2567058", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IATl, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} information for authors", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1157--1158", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2567118", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:SISf, author = "Anonymous", title = "Special issue on sound scene and event analysis", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1159", month = jun, year = "2016", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2016.2567102", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:SIBb, author = "Anonymous", title = "Special Issue on Biosignal-based Spoken Communication", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "1160", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2567139", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:FCf, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "C1", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2561219", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IATm, author = "Anonymous", title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} publication information", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "C2", month = jun, year = "2016", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2016.2567039", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:IPEb, author = "Anonymous", title = "{IEEE Power Electronics Society} Information", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "C3", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2568018", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:BPd, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "24", number = "6", pages = "C4", month = jun, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2568019", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gao:2016:SSA, author = "Min Gao and Jing Lu and Xiaojun Qiu", title = "A Simplified Subband {ANC} Algorithm Without Secondary Path Modeling", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1164--1174", month = jul, year = "2016", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2016.2516439", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Aihara:2016:MNN, author = "Ryo Aihara and Tetsuya Takiguchi and Yasuo Ariki", title = "Multiple Non-Negative Matrix Factorization for Many-to-Many Voice Conversion", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1175--1184", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2522643", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2016:TDB, author = "Kai Chen and Qiang Huo", title = "Training Deep Bidirectional {LSTM} Acoustic Model for {LVCSR} by a Context-Sensitive-Chunk {BPTT} Approach", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1185--1193", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2539499", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Stafylakis:2016:TDS, author = "Themos Stafylakis and Md. 
Jahangir Alam and Patrick Kenny", title = "Text-Dependent Speaker Recognition With Random Digit Strings", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1194--1203", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2546458", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Deepak:2016:FSS, author = "K. T. Deepak and S. R. Mahadeva Prasanna", title = "Foreground Speech Segmentation and Enhancement Using Glottal Closure Instants and Mel Cepstral Coefficients", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1204--1218", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2549699", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hajimolahoseini:2016:RET, author = "Habib Hajimolahoseini and Rassoul Amirfattahi and Saeed Gazor and Hamid Soltanian-Zadeh", title = "Robust Estimation and Tracking of Pitch Period Using an Efficient {Bayesian} Filter", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1219--1229", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2551041", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, 
fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sahoo:2016:NMG, author = "Subhasmita Sahoo and Aurobinda Routray", title = "A Novel Method of Glottal Inverse Filtering", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1230--1241", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2551864", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Degottex:2016:MFA, author = "Gilles Degottex and Luc Ardaillon and Axel Roebel", title = "Multi-Frame Amplitude Envelope Estimation for Modification of Singing Voice", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1242--1254", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2551863", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2016:ITM, author = "Zhizheng Wu and Simon King", title = "Improving Trajectory Modelling for {DNN}-Based Speech Synthesis by Using Stacked Bottleneck Features and Minimum Generation Error Training", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1255--1265", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2551865", 
ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jaureguiberry:2016:FMS, author = "Xabier Jaureguiberry and Emmanuel Vincent and Ga{\"e}l Richard", title = "Fusion Methods for Speech Enhancement and Audio Source Separation", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1266--1279", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2553441", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Das:2016:IPP, author = "Rajib Lochan Das and Mrityunjoy Chakraborty", title = "Improving the Performance of the {PNLMS} Algorithm Using Norm Regularization", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1280--1290", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2552578", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Taseska:2016:SSF, author = "Maja Taseska and Emanu{\"e}l A. P. 
Habets", title = "Spotforming: Spatial Filtering With Distributed Arrays for Position-Selective Sound Acquisition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1291--1304", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2540815", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2016:LMT, author = "Guangyou Zhou and Zhiwen Xie and Tingting He and Jun Zhao and Xiaohua Tony Hu", title = "Learning the Multilingual Translation Representations for Question Retrieval in Community Question Answering via Non-Negative Matrix Factorization", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1305--1314", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2544661", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kim:2016:PNC, author = "Chanwoo Kim and Richard M. 
Stern", title = "Power-Normalized Cepstral Coefficients {(PNCC)} for Robust Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "7", pages = "1315--1329", month = jul, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2545928", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:38 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schepker:2016:LSE, author = "Henning Schepker and Simon Doclo", title = "Least-Squares Estimation of the Common Pole-Zero Filter of Acoustic Feedback Paths in Hearing Aids", journal = j-IEEE-ACM-TASLP, volume = "24", number = "8", pages = "1334--1347", month = aug, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2554288", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:39 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pessentheiner:2016:LCM, author = "Hannes Pessentheiner and Martin Hagm{\"u}ller and Gernot Kubin", title = "Localization and Characterization of Multiple Harmonic Sources", journal = j-IEEE-ACM-TASLP, volume = "24", number = "8", pages = "1348--1363", month = aug, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2556282", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:39 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and 
Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Khalilian:2016:CLP, author = "Hanieh Khalilian and Ivan V. Baji{\'c} and Rodney G. Vaughan", title = "Comparison of Loudspeaker Placement Methods for Sound Field Reproduction", journal = j-IEEE-ACM-TASLP, volume = "24", number = "8", pages = "1364--1379", month = aug, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2556860", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:39 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2016:SAS, author = "Cheng-Yen Yang and Chih-Wei Liu and Shyh-Jye Jou", title = "A Systematic {ANSI S1.11} Filter Bank Specification Relaxation and Its Efficient Multirate Architecture for Hearing-Aid Systems", journal = j-IEEE-ACM-TASLP, volume = "24", number = "8", pages = "1380--1392", month = aug, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2556422", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:39 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Laufer-Goldshtein:2016:SSS, author = "Bracha Laufer-Goldshtein and Ronen Talmon and Sharon Gannot", title = "Semi-Supervised Sound Source Localization Based on Manifold Regularization", journal = j-IEEE-ACM-TASLP, volume = "24", number = "8", pages = "1393--1407", month = aug, year = "2016", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2016.2555085", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:39 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kounades-Bastian:2016:VEA, author = "Dionyssos Kounades-Bastian and Laurent Girin and Xavier Alameda-Pineda and Sharon Gannot and Radu Horaud", title = "A Variational {EM} Algorithm for the Separation of Time-Varying Convolutive Audio Mixtures", journal = j-IEEE-ACM-TASLP, volume = "24", number = "8", pages = "1408--1423", month = aug, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2554286", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:39 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Du:2016:RAS, author = "Jun Du and Yanhui Tu and Li-Rong Dai and Chin-Hui Lee", title = "A Regression Approach to Single-Channel Speech Separation Via High-Resolution Deep Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "24", number = "8", pages = "1424--1437", month = aug, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2558822", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:39 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
@Article{Liu:2016:TEL, author = "Xunying Liu and Xie Chen and Yongqiang Wang and Mark J. F. Gales and Philip C. Woodland", title = "Two Efficient Lattice Rescoring Methods Using Recurrent Neural Network Language Models", journal = j-IEEE-ACM-TASLP, volume = "24", number = "8", pages = "1438--1449", month = aug, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2558826", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:39 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Swietojanski:2016:LHU, author = "Pawel Swietojanski and Jinyu Li and Steve Renals", title = "Learning Hidden Unit Contributions for Unsupervised Acoustic Model Adaptation", journal = j-IEEE-ACM-TASLP, volume = "24", number = "8", pages = "1450--1463", month = aug, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2560534", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:39 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2016:LRF, author = "Meng Zhang and Yang Liu and Huanbo Luan and Maosong Sun", title = "Listwise Ranking Functions for Statistical Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "24", number = "8", pages = "1464--1472", month = aug, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2560527", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed Jun 8 09:17:39 MDT 2016", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:TCm, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "24", number = "9", pages = "1477--1478", month = sep, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2599056", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:17 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2016:TCn, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "24", number = "9", pages = "1479--1480", month = sep, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2599098", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:17 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cavalieri:2016:CLM, author = "Daniel C. Cavalieri and Sira E. Palazuelos-Cagigas and Teodiano F. 
Bastos-Filho and M{\'a}rio Sarcinelli-Filho", title = "Combination of Language Models for Word Prediction: An Exponential Approach", journal = j-IEEE-ACM-TASLP, volume = "24", number = "9", pages = "1481--1494", month = sep, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2547743", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:17 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schwartz:2016:EMA, author = "Ofer Schwartz and Sharon Gannot and Emanu{\"e}l A. P. Habets", title = "An Expectation-Maximization Algorithm for Multimicrophone Speech Dereverberation and Noise Reduction With Coherence Matrix Estimation", journal = j-IEEE-ACM-TASLP, volume = "24", number = "9", pages = "1495--1510", month = sep, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2553457", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:17 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Delikaris-Manias:2016:SDS, author = "Symeon Delikaris-Manias and Juha Vilkamo and Ville Pulkki", title = "Signal-Dependent Spatial Filtering Based on Weighted-Orthogonal Beamformers in the Spherical Harmonic Domain", journal = j-IEEE-ACM-TASLP, volume = "24", number = "9", pages = "1511--1523", month = sep, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2560523", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:17 MDT 2016", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2016:SSA, author = "Sheng Li and Yuya Akita and Tatsuya Kawahara", title = "Semi-Supervised Acoustic Model Training by Discriminative Data Selection From Multiple {ASR} Systems' Hypotheses", journal = j-IEEE-ACM-TASLP, volume = "24", number = "9", pages = "1524--1534", month = sep, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2562505", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:17 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Dittmar:2016:REA, author = "Christian Dittmar and Meinard M{\"u}ller", title = "Reverse Engineering the Amen Break --- Score-Informed Separation and Restoration Applied to Drum Recordings", journal = j-IEEE-ACM-TASLP, volume = "24", number = "9", pages = "1535--1547", month = sep, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2567645", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:17 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pan:2016:ROR, author = "Chao Pan and Jingdong Chen and Jacob Benesty", title = "Reduced-Order Robust Superdirective Beamforming With Uniform Linear Microphone Arrays", journal = 
j-IEEE-ACM-TASLP, volume = "24", number = "9", pages = "1548--1559", month = sep, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2568044", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:17 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{FitzGerald:2016:PBD, author = "Derry FitzGerald and Antoine Liutkus and Roland Badeau", title = "Projection-Based Demixing of Spatial Audio", journal = j-IEEE-ACM-TASLP, volume = "24", number = "9", pages = "1560--1572", month = sep, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2570945", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:17 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2016:DSS, author = "Lin Wang and Joshua D. 
Reiss and Andrea Cavallaro", title = "Over-Determined Source Separation and Localization Using Distributed Microphones", journal = j-IEEE-ACM-TASLP, volume = "24", number = "9", pages = "1573--1588", month = sep, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2573048", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:17 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2016:RCM, author = "Yang Liu and Sujian Li and Furu Wei and Heng Ji", title = "Relation Classification Via Modeling Augmented Dependency Paths", journal = j-IEEE-ACM-TASLP, volume = "24", number = "9", pages = "1589--1598", month = sep, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2573050", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:17 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kuklasinski:2016:MLP, author = "Adam Kuklasi{\'n}ski and Simon Doclo and S{\o}ren Holdt Jensen and Jesper Jensen", title = "Maximum Likelihood {PSD} Estimation for Speech Enhancement in Reverberation and Noise", journal = j-IEEE-ACM-TASLP, volume = "24", number = "9", pages = "1599--1612", month = sep, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2573591", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:17 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash 
ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Karimian-Azari:2016:CEN,
  author = "Sam Karimian-Azari and Jesper Rindom Jensen and Mads Gr{\ae}sb{\o}ll Christensen",
  title = "Computationally Efficient and Noise Robust {DOA} and Pitch Estimation",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "9",
  pages = "1613--1625",
  month = sep,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2577501",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Kitamura:2016:DBS,
  author = "Daichi Kitamura and Nobutaka Ono and Hiroshi Sawada and Hirokazu Kameoka and Hiroshi Saruwatari",
  title = "Determined Blind Source Separation Unifying Independent Vector Analysis and Nonnegative Matrix Factorization",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "9",
  pages = "1626--1641",
  month = sep,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2577880",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Obin:2016:SSA,
  author = "Nicolas Obin and Axel Roebel",
  title = "Similarity Search of Acted Voices for Automatic Voice Casting",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "9",
  pages = "1642--1651",
  month = sep,
  year = "2016",
CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2580302",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Nugraha:2016:MAS,
  author = "Aditya Arie Nugraha and Antoine Liutkus and Emmanuel Vincent",
  title = "Multichannel Audio Source Separation With Deep Neural Networks",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "9",
  pages = "1652--1664",
  month = sep,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2580946",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Shum:2016:UAU,
  author = "Stephen H. Shum and David F. Harwath and Najim Dehak and James R.
Glass",
  title = "On the Use of Acoustic Unit Discovery for Language Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "9",
  pages = "1665--1676",
  month = sep,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2582260",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:IATn,
  author = "Anonymous",
  title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "9",
  pages = "1677--1678",
  month = sep,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607844",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:ITMa,
  author = "Anonymous",
  title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "9",
  pages = "1679--1680",
  month = sep,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607846",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp;
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:IIPa,
  author = "Anonymous",
  title = "Introducing the {IEEE PES Resource Center}",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "9",
  pages = "1681",
  month = sep,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2593548",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:FCg,
  author = "Anonymous",
  title = "Front Cover",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "9",
  pages = "C1",
  month = sep,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607904",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:ISPc,
  author = "Anonymous",
  title = "{IEEE Signal Processing Society}",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "9",
  pages = "C2",
  month = sep,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2598118",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}
@Article{Anonymous:2016:ISPd,
  author = "Anonymous",
  title = "{IEEE Signal Processing Society}",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "9",
  pages = "C3",
  month = sep,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607848",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:BPe,
  author = "Anonymous",
  title = "Blank page",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "9",
  pages = "C4",
  month = sep,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607850",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:TCo,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1677--1678",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607941",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:TCp,
  author = "Anonymous",
  title = "Table of Contents",
  journal =
j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1679--1680",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607939",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Eaton:2016:ERA,
  author = "James Eaton and Nikolay D. Gaubitch and Alastair H. Moore and Patrick A. Naylor",
  title = "Estimation of Room Acoustic Parameters: The {ACE} Challenge",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1681--1693",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2577502",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Nose:2016:EIG,
  author = "Takashi Nose",
  title = "Efficient Implementation of Global Variance Compensation for Parametric Speech Synthesis",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1694--1704",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2580298",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ghaffarzadegan:2016:GMP,
  author = "Shabnam Ghaffarzadegan and Hynek Bo{\v{r}}il and John H. L. Hansen",
  title = "Generative Modeling of Pseudo-Whisper for Robust Whispered Speech Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1705--1720",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2580944",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Mirsamadi:2016:GNT,
  author = "Seyedmahdad Mirsamadi and John H. L. Hansen",
  title = "A Generalized Nonnegative Tensor Factorization Approach for Distant Speech Recognition With Distributed Microphones",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1721--1731",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2580943",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Fuster:2016:AFX,
  author = "Laura Fuster and Maria de Diego and Luis A.
Azpicueta-Ruiz and Miguel Ferrer",
  title = "Adaptive Filtered-x Algorithms for Room Equalization Based on Block-Based Combination Schemes",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1732--1745",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2583065",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Adiloglu:2016:VBI,
  author = "Kamil Adilo{\u{g}}lu and Emmanuel Vincent",
  title = "Variational {Bayesian} Inference for Source Separation and Robust Feature Extraction",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1746--1758",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2583794",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Kortlang:2016:AMB,
  author = "Steffen Kortlang and Giso Grimm and Volker Hohmann and Birger Kollmeier and Stephan D.
Ewert",
  title = "Auditory Model-Based Dynamic Compression Controlled by Subband Instantaneous Frequency and Speech Presence Probability Estimates",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1759--1772",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2584705",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Swietojanski:2016:DPU,
  author = "Pawel Swietojanski and Steve Renals",
  title = "Differentiable Pooling for Unsupervised Acoustic Model Adaptation",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1773--1784",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2584700",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Niwa:2016:OMA,
  author = "Kenta Niwa and Yusuke Hioka and Kazunori Kobayashi",
  title = "Optimal Microphone Array Observation for Clear Recording of Distant Sound Sources",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1785--1795",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2585879",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM
Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Epain:2016:SHS,
  author = "Nicolas Epain and Craig T. Jin",
  title = "Spherical Harmonic Signal Covariance and Sound Field Diffuseness",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1796--1807",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2585862",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zorila:2016:NFF,
  author = "Tudor-C{\u{a}}t{\u{a}}lin Zoril{\u{a}} and Yannis Stylianou and Tatsuma Ishihara and Masami Akamine",
  title = "Near and Far Field Speech-in-Noise Intelligibility Improvements Based on a Time--Frequency Energy Reallocation Approach",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1808--1818",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2585864",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ma:2016:SWM,
  author = "Xi Ma and Dong Wang and Javier Tejedor",
  title = "Similar Word Model for Unfrequent Word Enhancement in Speech Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1819--1830",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI =
"https://doi.org/10.1109/TASLP.2016.2585863",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Bokaei:2016:SMT,
  author = "Mohammad Hadi Bokaei and Hossein Sameti and Yang Liu",
  title = "Summarizing Meeting Transcripts Based on Functional Segmentation",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1831--1841",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2585859",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhang:2016:ACL,
  author = "Jiajun Zhang and Yu Zhou and Chengqing Zong",
  title = "Abstractive Cross-Language Summarization via Translation Model Enhanced Predicate Argument Structure Fusing",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1842--1853",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2586608",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Lafay:2016:MMS,
  author = "Gr{\'e}goire Lafay and Mathieu Lagrange and Mathias
Rossignol and Emmanouil Benetos and Axel Roebel",
  title = "A Morphological Model for Simulating Acoustic Scenes and Its Application to Sound Event Detection",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1854--1864",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2587218",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ji:2016:PRS,
  author = "An Ji and Michael T. Johnson and Jeffrey J. Berry",
  title = "Parallel Reference Speaker Weighting for Kinematic-Independent Acoustic-to-Articulatory Inversion",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1865--1875",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2588340",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:IATo,
  author = "Anonymous",
  title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1876--1877",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607881",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =
"IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:ITMb,
  author = "Anonymous",
  title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1878--1879",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607883",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:IIPb,
  author = "Anonymous",
  title = "Introducing the {IEEE PES Resource Center}",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "1880",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607899",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:FCh,
  author = "Anonymous",
  title = "Front Cover",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "C1",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607906",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM
Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:ISPe,
  author = "Anonymous",
  title = "{IEEE Signal Processing Society}",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "C2",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607859",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:ISPf,
  author = "Anonymous",
  title = "{IEEE Signal Processing Society}",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "C3",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607885",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:BPf,
  author = "Anonymous",
  title = "Blank page",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "10",
  pages = "C4",
  month = oct,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2607887",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:17 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:TCq,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "11",
  pages = "1881--1882",
  month = nov,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2618239",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:18 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2016:TCr,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "11",
  pages = "1883--1884",
  month = nov,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2618225",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:18 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Gkiokas:2016:TMP,
  author = "Aggelos Gkiokas and Vassilis Katsouros and George Carayannis",
  title = "Towards Multi-Purpose Spectral Rhythm Features: An Application to Dance Style, Meter and Tempo Estimation",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "11",
  pages = "1885--1896",
  month = nov,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2554283",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:18 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on
Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Huang:2016:IMP,
  author = "Yi-Chin Huang and Chung-Hsien Wu and Si-Ting Weng",
  title = "Improving {Mandarin} Prosody Generation Using Alternative Smoothing Techniques",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "11",
  pages = "1897--1907",
  month = nov,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2588727",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:18 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Andersen:2016:PIN,
  author = "Asger Heidemann Andersen and Jan Mark de Haan and Zheng-Hua Tan and Jesper Jensen",
  title = "Predicting the Intelligibility of Noisy and Nonlinearly Processed Binaural Speech",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "11",
  pages = "1908--1920",
  month = nov,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2588002",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:18 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhang:2016:DMA,
  author = "Qiaoling Zhang and Zhe Chen and Fuliang Yin",
  title = "Distributed Marginalized Auxiliary Particle Filter for Speaker Tracking in Distributed Microphone Networks",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "11",
  pages = "1921--1934",
  month = nov,
  year = "2016",
  CODEN = "????",
  DOI =
"https://doi.org/10.1109/TASLP.2016.2590146",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:18 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ferras:2016:SDL,
  author = "Marc Ferr{\`a}s and Srikanth Madikeri and Herv{\'e} Bourlard",
  title = "Speaker Diarization and Linking of Meeting Data",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "11",
  pages = "1935--1945",
  month = nov,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2590139",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:18 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Liu:2016:GBS,
  author = "Yuzong Liu and Katrin Kirchhoff",
  title = "Graph-Based Semisupervised Learning for Acoustic Modeling in Automatic Speech Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "24",
  number = "11",
  pages = "1946--1956",
  month = nov,
  year = "2016",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2593800",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Tue Oct 25 08:43:18 MDT 2016",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2016:CBW,
  author = "Jin Wang and Liang-Chih Yu and K.
Robert Lai and Xuejie Zhang", title = "Community-Based Weighted Graph Model for Valence-Arousal Prediction of Affective Words", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "1957--1968", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2594287", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Carini:2016:RRI, author = "Alberto Carini and Stefania Cecchi and Laura Romoli", title = "Robust Room Impulse Response Measurement Using Perfect Sequences for {Legendre} Nonlinear Filters", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "1969--1982", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2593803", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ewert:2016:PTS, author = "Sebastian Ewert and Mark Sandler", title = "Piano Transcription in the Studio Using an Extensible Alternating Directions Framework", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "1983--1997", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2593801", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM
Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chien:2016:ALA, author = "Yu-Ren Chien and Hsin-Min Wang and Shyh-Kang Jeng", title = "Alignment of Lyrics With Accompanied Singing Audio Based on Acoustic-Phonetic Vowel Likelihood Modeling", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "1998--2008", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2594282", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jensen:2016:API, author = "Jesper Jensen and Cees H. Taal", title = "An Algorithm for Predicting the Intelligibility of Speech Masked by Modulated Noise Maskers", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "2009--2022", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2585878", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cui:2016:MLN, author = "Xiaodong Cui and Vaibhava Goel", title = "Maximum Likelihood Nonlinear Transformations Based on Deep Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "2023--2031", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2594255", ISSN =
"2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", note = "See correction \cite{Kuklasinski:2017:CTM}.", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nakashika:2016:NPT, author = "Toru Nakashika and Tetsuya Takiguchi and Yasuhiro Minami", title = "Non-Parallel Training in Voice Conversion Using an Adaptive Restricted {Boltzmann} Machine", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "2032--2045", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2593263", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liao:2016:SAS, author = "I-Bin Liao and Chen-Yu Chiang and Yih-Ru Wang and Sin-Horng Chen", title = "Speaker Adaptation of {SR-HPM} for Speaking Rate-Controlled {Mandarin} {TTS}", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "2046--2058", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2598307", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ouchi:2016:TBD, author = "Hiroki Ouchi and Kevin Duh and
Hiroyuki Shindo and Yuji Matsumoto", title = "Transition-Based Dependency Parsing Exploiting Supertags", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "2059--2068", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2598310", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xiao:2016:LAA, author = "Tong Xiao and Derek F. Wong and Jingbo Zhu", title = "A Loss-Augmented Approach to Training Syntactic Machine Translation Systems", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "2069--2083", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2594383", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ikemiya:2016:SVS, author = "Yukara Ikemiya and Katsutoshi Itoyama and Kazuyoshi Yoshii", title = "Singing Voice Separation and Vocal {F0} Estimation Based on Mutual Combination of Robust Principal Component Analysis and Subharmonic Summation", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "2084--2095", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2577879", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement =
ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sigtia:2016:AES, author = "Siddharth Sigtia and Adam M. Stark and Sacha Krstulovi{\'c} and Mark D. Plumbley", title = "Automatic Environmental Sound Recognition: Performance Versus Computational Cost", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "2096--2107", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2592698", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Parthasarathy:2016:UAD, author = "Srinivas Parthasarathy and Roddy Cowie and Carlos Busso", title = "Using Agreement on Direction of Change to Build Rank-Based Emotion Classifiers", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "2108--2121", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2593944", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2016:CSB, author = "Jia-Ching Wang and Yuan-Shan Lee and Chang-Hong Lin and Shu-Fan Wang and Chih-Hao Shih and Chung-Hsien Wu", title = "Compressive Sensing-Based Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages =
"2122--2131", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2598306", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2016:REJ, author = "Siying Wang and Sebastian Ewert and Simon Dixon", title = "Robust and Efficient Joint Alignment of Multiple Musical Performances", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "2132--2145", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2598318", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2016:ETE, author = "Xie Chen and Xunying Liu and Yongqiang Wang and Mark J. F. Gales and Philip C.
Woodland", title = "Efficient Training and Evaluation of Recurrent Neural Network Language Models for Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "2146--2157", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2598304", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jao:2016:MMS, author = "Ping-Keng Jao and Li Su and Yi-Hsuan Yang and Brendt Wohlberg", title = "Monaural Music Source Separation Using Convolutional Sparse Coding", journal = j-IEEE-ACM-TASLP, volume = "24", number = "11", pages = "2158--2170", month = nov, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2598323", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cogliati:2016:CDP, author = "Andrea Cogliati and Zhiyao Duan and Brendt Wohlberg", title = "Context-Dependent Piano Music Transcription With Convolutional Sparse Coding", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2218--2230", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2598305", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM
Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qian:2016:NNB, author = "Yanmin Qian and Tian Tan and Dong Yu", title = "Neural Network Based Multi-Factor Aware Joint Training for Robust Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2231--2240", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2598308", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Samarakoon:2016:FHL, author = "Lahiru Samarakoon and Khe Chai Sim", title = "Factorized Hidden Layer Adaptation for Deep Neural Network Based Acoustic Modeling", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2241--2250", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2601146", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Krawczyk-Becker:2016:MBE, author = "Martin Krawczyk-Becker and Timo Gerkmann", title = "On {MMSE}-Based Estimation of Amplitude and Complex Speech Spectral Coefficients Under Phase-Uncertainty", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2251--2262", month = dec, year = "2016", CODEN = "????", DOI =
"https://doi.org/10.1109/TASLP.2016.2602549", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qian:2016:VDC, author = "Yanmin Qian and Mengxiao Bi and Tian Tan and Kai Yu", title = "Very Deep Convolutional Neural Networks for Noise Robust Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2263--2276", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2602884", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2016:GAA, author = "Yi-Chan Wu and Homer H.
Chen", title = "Generation of Affective Accompaniment in Accordance With Emotion Flow", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2277--2287", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2603006", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Movassagh:2016:SAC, author = "Mahmood Movassagh and Peter Kabal", title = "Scalable Audio Coding Using {Trellis}-Based Optimized Joint Entropy Coding and Quantization", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2288--2300", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2607339", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cernak:2016:CDS, author = "Milos Cernak and Alexandros Lazaridis and Afsaneh Asaei and Philip N.
Garner", title = "Composition of Deep and Spiking Neural Networks for Very Low Bit Rate Speech Coding", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2301--2312", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2604566", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Dov:2016:KMV, author = "David Dov and Ronen Talmon and Israel Cohen", title = "Kernel Method for Voice Activity Detection in the Presence of Transients", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2313--2326", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2566919", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Villalba:2016:BNM, author = "Jes{\'u}s Villalba and Antonio Miguel and Alfonso Ortega and Eduardo Lleida", title = "{Bayesian} Networks to Model the Variability of Speaker Verification Scores in Adverse Environments", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2327--2340", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2607343", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM
Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sailor:2016:NUA, author = "Hardik B. Sailor and Hemant A. Patil", title = "Novel Unsupervised Auditory Filterbank Learning Using Convolutional {RBM} for Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2341--2353", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2607341", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Norholm:2016:IFF, author = "Sidsel Marie N{\o}rholm and Jesper Rindom Jensen and Mads Gr{\ae}sb{\o}ll Christensen", title = "Instantaneous Fundamental Frequency Estimation With Optimal Segmentation for Nonstationary Voiced Speech", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2354--2367", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2608948", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2016:RVS, author = "Sheng Zhang and Jiashu Zhang and Hongyu Han", title = "Robust Variable Step-Size Decorrelation Normalized Least-Mean-Square Algorithm and its Application to Acoustic Echo Cancellation", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages =
"2368--2376", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2556280", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Barker:2016:BSA, author = "Tom Barker and Tuomas Virtanen", title = "Blind Separation of Audio Mixtures Through Nonnegative Tensor Factorization of Modulation Spectrograms", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2377--2389", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2602546", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2016:ACM, author = "Jinxin Liu and Xuefeng Chen", title = "Adaptive Compensation of Misequalization in Narrowband Active Noise Equalizer Systems", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2390--2399", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2604212", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ogawa:2016:ESR, author = "Atsunori
Ogawa and Takaaki Hori and Atsushi Nakamura", title = "Estimating Speech Recognition Accuracy Based on Error Type Classification", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2400--2413", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2603599", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kelly:2016:SAC, author = "Finnian Kelly and John H. L. Hansen", title = "Score-Aging Calibration for Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2414--2424", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2602542", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2016:ASF, author = "Bochen Li and Zhiyao Duan", title = "An Approach to Score Following for Piano Performances With the Sustained Effect", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2425--2438", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2611938", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL =
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Moritz:2016:IOM, author = "Niko Moritz and Birger Kollmeier and J{\"o}rn Anem{\"u}ller", title = "Integration of Optimized Modulation Filter Sets Into Deep Neural Networks for Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2439--2452", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2615239", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Leglaive:2016:MAS, author = "Simon Leglaive and Roland Badeau and Ga{\"e}l Richard", title = "Multichannel Audio Source Separation With Probabilistic Reverberation Priors", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2453--2465", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2614140", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tervo:2016:SSD, author = "Sakari Tervo", title = "Single Snapshot Detection and Estimation of Reflections From Room Impulse Responses in the Spherical Harmonic Domain", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2466--2480", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2615238", ISSN = "2329-9290", ISSN-L =
"2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Markovic:2016:EAS, author = "Dejan Markovi{\'c} and Fabio Antonacci and Lucio Bianchi and Stefano Tubaro and Augusto Sarti", title = "Extraction of Acoustic Sources Through the Processing of Sound Field Maps in the Ray Space", journal = j-IEEE-ACM-TASLP, volume = "24", number = "12", pages = "2481--2494", month = dec, year = "2016", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2615242", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Tue Oct 25 08:43:18 MDT 2016", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:TCa, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "25", number = "2", pages = "222--223", month = feb, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2651831", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Feb 25 09:40:47 MST 2017", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:TCb, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "25", number = "2", pages = "224--225", month = feb, year = "2017", CODEN = "????", DOI =
"https://doi.org/10.1109/TASLP.2017.2651833", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Feb 25 09:40:47 MST 2017", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2017:DRE, author = "Hanchi Chen and Thushara Dheemantha Abhayapala and Prasanga N. Samarasinghe and Wen Zhang", title = "Direct-to-Reverberant Energy Ratio Estimation Using a First-Order Microphone", journal = j-IEEE-ACM-TASLP, volume = "25", number = "2", pages = "226--237", month = feb, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2601222", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Feb 25 09:40:47 MST 2017", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bell:2017:MLC, author = "Peter Bell and Pawel Swietojanski and Steve Renals", title = "Multitask Learning of Context-Dependent Targets in Deep Neural Network Acoustic Models", journal = j-IEEE-ACM-TASLP, volume = "25", number = "2", pages = "238--247", month = feb, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2630305", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Feb 25 09:40:47 MST 2017", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2017:TAD, author = "Rui Zhao and Kezhi Mao", title
= "Topic-Aware Deep Compositional Models for Sentence Classification", journal = j-IEEE-ACM-TASLP, volume = "25", number = "2", pages = "248--260", month = feb, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2632521", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Feb 25 09:40:47 MST 2017", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{ElBadawy:2017:FAS, author = "Dalia {El Badawy} and Ngoc Q. K. Duong and Alexey Ozerov", title = "On-the-Fly Audio Source Separation --- A Novel User-Friendly Framework", journal = j-IEEE-ACM-TASLP, volume = "25", number = "2", pages = "261--272", month = feb, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2632528", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Feb 25 09:40:47 MST 2017", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Elvander:2017:OEM, author = "Filip Elvander and Johan Sw{\"a}rd and Andreas Jakobsson", title = "Online Estimation of Multiple Harmonic Signals", journal = j-IEEE-ACM-TASLP, volume = "25", number = "2", pages = "273--284", month = feb, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2634118", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Feb 25 09:40:47 MST 2017", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL =
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Renkens:2017:WSL, author = "Vincent Renkens and Hugo {Van hamme}", title = "Weakly Supervised Learning of Hidden {Markov} Models for Spoken Language Acquisition", journal = j-IEEE-ACM-TASLP, volume = "25", number = "2", pages = "285--295", month = feb, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2633812", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Feb 25 09:40:47 MST 2017", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Remaggi:2017:ARL, author = "Luca Remaggi and Philip J. B. Jackson and Philip Coleman and Wenwu Wang", title = "Acoustic Reflector Localization: Novel Image Source Reversion and Direct Localization Methods", journal = j-IEEE-ACM-TASLP, volume = "25", number = "2", pages = "296--309", month = feb, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2633802", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Feb 25 09:40:47 MST 2017", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Samarasinghe:2017:EDR, author = "Prasanga N. Samarasinghe and Thushara D.
Abhayapala and Hanchi Chen",
  title = "Estimating the Direct-to-Reverberant Energy Ratio Using a Spherical Harmonics-Based Spatial Correlation Model",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "310--319",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2633811",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 2 entries: month = feb is inferred from the issue
%%% number (elsewhere in this file number 1 carries month = jan).

@Article{Markovich-Golan:2017:CLT,
  author = "Shmulik Markovich-Golan and Sharon Gannot and Walter Kellermann",
  title = "Combined {LCMV-TRINICON} Beamforming for Separating Multiple Speech Sources in Noisy and Reverberant Environments",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "320--332",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2633806",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ahmed:2017:GSA,
  author = "Shakeel Ahmed and Muhammad Tahir Akhtar",
  title = "Gain Scheduling of Auxiliary Noise and Variable Step-Size for Online Acoustic Feedback Cancellation in Narrow-Band Active Noise Control Systems",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "333--343",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2635029",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Sargent:2017:ESS,
  author = "Gabriel Sargent and Fr{\'e}d{\'e}ric Bimbot and Emmanuel Vincent",
  title = "Estimating the Structural Segmentation of Popular Music Pieces Under Regularity Constraints",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "344--358",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2635031",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Cheer:2017:IDS,
  author = "Jordan Cheer and Stephen Daley",
  title = "An Investigation of Delayless Subband Adaptive Filtering for Multi-Input Multi-Output Active Noise Control Applications",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "359--373",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2637298",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Schlecht:2017:FDN,
  author = "Sebastian J. Schlecht and Emanu{\"e}l A. P.
Habets",
  title = "Feedback Delay Networks: Echo Density and Mixing Time",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "374--383",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2635027",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 2 entries: month = feb is inferred from the issue
%%% number (elsewhere in this file number 1 carries month = jan).

@Article{Abel:2017:IQM,
  author = "Johannes Abel and Magdalena Kaniewska and Cyril Guillaum{\'e} and Wouter Tirry and Tim Fingscheidt",
  title = "An Instrumental Quality Measure for Artificially Bandwidth-Extended Speech Signals",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "384--396",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2635022",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Rehr:2017:AAR,
  author = "Robert Rehr and Timo Gerkmann",
  title = "An Analysis of Adaptive Recursive Smoothing with Applications to Noise {PSD} Estimation",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "397--408",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2633803",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and
Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 2 entries: month = feb is inferred from the issue
%%% number (elsewhere in this file number 1 carries month = jan).

@Article{Granell:2017:MCT,
  author = "Emilio Granell and Carlos-D. Mart{\'\i}nez-Hinarejos",
  title = "Multimodal Crowdsourcing for Transcribing Handwritten Documents",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "409--419",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2634123",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ma:2017:NSO,
  author = "Yaping Ma and Yegui Xiao",
  title = "A New Strategy for Online Secondary-Path Modeling of Narrowband Active Noise Control",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "420--434",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2633799",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Belloch:2017:GBD,
  author = "Jose A. Belloch and Alberto Gonzalez and Enrique S.
Quintana-Ort{\'\i} and Miguel Ferrer and Vesa V{\"a}lim{\"a}ki",
  title = "{GPU}-Based Dynamic Wave Field Synthesis Using Fractional Delay Filters and Room Compensation",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "435--447",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2631338",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 2 front and back matter: month = feb is inferred
%%% from the issue number (elsewhere in this file number 1 carries
%%% month = jan).

@Article{Anonymous:2017:IATa,
  author = "Anonymous",
  title = "{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing} Edics",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "448--449",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2651844",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:ITMa,
  author = "Anonymous",
  title = "{IEEE} Transactions on Multimedia information for authors",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "450--451",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2651846",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:IICa,
  author = "Anonymous",
  title = "Introducing {IEEE Collabratec}",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "452",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2653961",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:FCa,
  author = "Anonymous",
  title = "Front Cover",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "C1",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2651840",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:ISPa,
  author = "Anonymous",
  title = "{IEEE Signal Processing Society}",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "2",
  pages = "C2",
  month = feb,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2651842",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp;
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 3 entries: month = mar is inferred from the issue
%%% number (elsewhere in this file number 1 carries month = jan).

@Article{Anonymous:2017:TCc,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "3--4",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2671139",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:46 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:TCd,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "3--4",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2671141",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:46 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% NOTE(review): the next two entries (TCe, TCf) carry the same DOIs and
%%% pages as TCc and TCd above and differ only in bibdate; they look like
%%% duplicates but are kept so that existing citations still resolve.
%%% Pages "3--4" also do not fit issue 3, whose first article starts at
%%% page 457 --- confirm against the publisher before correcting.

@Article{Anonymous:2017:TCe,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "3--4",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2671139",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:TCf,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "3--4",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2671141",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{He:2017:MUA,
  author = "Qi He and Feng Bao and Changchun Bao",
  title = "Multiplicative Update of Auto-Regressive Gains for Codebook-Based Speech Enhancement",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "457--468",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2636445",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2017:EAC,
  author = "Zhongqing Wang and Sophia Yat Mei Lee and Shoushan Li and Guodong Zhou",
  title = "Emotion Analysis in Code-Switching Text With Joint Factor Graph Model",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "469--480",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2637280",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp;
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 3 entries: month = mar is inferred from the issue
%%% number (elsewhere in this file number 1 carries month = jan).

@Article{Bellur:2017:FDS,
  author = "Ashwin Bellur and Mounya Elhilali",
  title = "Feedback-Driven Sensory Mapping Adaptation for Robust Speech Activity Detection",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "481--492",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2639322",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Tang:2017:CJT,
  author = "Zhiyuan Tang and Lantian Li and Dong Wang and Ravichander Vipperla",
  title = "Collaborative Joint Training With Multitask Recurrent Model for Speech and Speaker Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "493--504",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2639323",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Sharma:2017:SMU,
  author = "Bidisha Sharma and S. R.
Mahadeva Prasanna",
  title = "Sonority Measurement Using System, Source, and Suprasegmental Information",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "505--518",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2641901",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 3 entries: month = mar is inferred from the issue
%%% number (elsewhere in this file number 1 carries month = jan).

@Article{Lee:2017:PRN,
  author = "Hung-Yi Lee and Bo-Hsiang Tseng and Tsung-Hsien Wen and Yu Tsao",
  title = "Personalizing Recurrent-Neural-Network-Based Language Model by Social Network",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "519--530",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2635445",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ming:2017:SEB,
  author = "Ji Ming and Danny Crookes",
  title = "Speech Enhancement Based on Full-Sentence Correlation and Clean Speech Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "531--543",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2651406",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language
Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 3 entries: month = mar is inferred from the issue
%%% number (elsewhere in this file number 1 carries month = jan).

@Article{Do:2017:PWL,
  author = "Quoc Truong Do and Tomoki Toda and Graham Neubig and Sakriani Sakti and Satoshi Nakamura",
  title = "Preserving Word-Level Emphasis in Speech-to-Speech Translation",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "544--556",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2643280",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Li:2017:CPT,
  author = "Zhenghua Li and Jiayuan Chao and Min Zhang and Wenliang Chen and Meishan Zhang and Guohong Fu",
  title = "Coupled {POS} Tagging on Heterogeneous Annotations",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "557--571",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2644262",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Doire:2017:SCO,
  author = "Clement S. J. Doire and Mike Brookes and Patrick A. Naylor and Christopher M. Hicks and Dave Betts and Mohammad A.
Dmour and S{\o}ren Holdt Jensen",
  title = "Single-Channel Online Enhancement of Speech Corrupted by Reverberation and Noise",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "572--587",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2641904",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 3 entries: month = mar is inferred from the issue
%%% number (elsewhere in this file number 1 carries month = jan).

@Article{Sizov:2017:DOD,
  author = "Aleksandr Sizov and Kong Aik Lee and Tomi Kinnunen",
  title = "Direct Optimization of the Detection Cost for {$I$}-Vector-Based Spoken Language Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "588--597",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2651377",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Sheikh:2017:MSC,
  author = "Imran Sheikh and Dominique Fohr and Irina Illina and Georges Linar{\`e}s",
  title = "Modelling Semantic Context of {OOV} Words in Large Vocabulary Continuous Speech Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "598--610",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2651361",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 3 entries: month = mar is inferred from the issue
%%% number (elsewhere in this file number 1 carries month = jan).

@Article{Farmani:2017:ISS,
  author = "Mojtaba Farmani and Michael Syskind Pedersen and Zheng-Hua Tan and Jesper Jensen",
  title = "Informed Sound Source Localization Using Relative Transfer Functions for Hearing Aid Applications",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "611--623",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2651373",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Vikram:2017:EET,
  author = "C. M. Vikram and S. R.
Mahadeva Prasanna",
  title = "Epoch Extraction From Telephone Quality Speech Using Single Pole Filter",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "624--636",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2651391",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 3 entries: month = mar is inferred from the issue
%%% number (elsewhere in this file number 1 carries month = jan).

@Article{Omachi:2017:AMM,
  author = "Motoi Omachi and Tetsuji Ogawa and Tetsunori Kobayashi",
  title = "Associative Memory Model-Based Linear Filtering and Its Application to Tandem Connectionist Blind Source Separation",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "637--650",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2653941",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Cherkassky:2017:BSW,
  author = "Dani Cherkassky and Sharon Gannot",
  title = "Blind Synchronization in Wireless Acoustic Sensor Networks",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "651--661",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2655259",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and
Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 3 entries: month = mar is inferred from the issue
%%% number (elsewhere in this file number 1 carries month = jan).

@Article{Girin:2017:ECG,
  author = "Laurent Girin and Thomas Hueber and Xavier Alameda-Pineda",
  title = "Extending the Cascaded {Gaussian} Mixture Regression Framework for Cross-Speaker Acoustic-Articulatory Mapping",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "662--673",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2651398",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Bahari:2017:BSR,
  author = "Mohamad Hasan Bahari and Alexander Bertrand and Marc Moonen",
  title = "Blind Sampling Rate Offset Estimation for Wireless Acoustic Sensor Networks Through Weighted Least-Squares Coherence Drift Estimation",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "674--686",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2647713",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% The correction below occupies one page, so pages is written as a
%%% single page number rather than the degenerate range "687--687".

@Article{Kuklasinski:2017:CML,
  author = "Adam Kuklasi{\'n}ski and Simon Doclo and S{\o}ren Holdt Jensen and Jesper Jensen",
  title = "Correction to {``Maximum Likelihood PSD Estimation for Speech Enhancement in Reverberation and Noise''}",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "3",
  pages = "687",
  month = mar,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2649958",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Feb 25 09:40:47 MST 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  note = "See \cite{Cui:2016:MLN}.",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 4 entries: month = apr is inferred from the issue
%%% number in the same way.

@Article{Anonymous:2017:TCg,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "688--689",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2684683",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:TCh,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "690--691",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2684681",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Gannot:2017:CPM,
  author = "Sharon Gannot and Emmanuel Vincent and Shmulik Markovich-Golan and Alexey Ozerov",
  title = "A Consolidated Perspective on Multimicrophone Speech
Enhancement and Source Separation",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "692--730",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2647702",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7805139/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 4 entries: month = apr is inferred from the issue
%%% number (elsewhere in this file number 1 carries month = jan).

@Article{Ying:2017:WDS,
  author = "Dongwen Ying and Ruohua Zhou and Junfeng Li and Yonghong Yan",
  title = "Window-Dominant Signal Subspace Methods for Multiple Short-Term Speech Source Localization",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "731--744",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2625458",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7736102/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wood:2017:BSS,
  author = "Sean U. N.
Wood and Jean Rouat and St{\'e}phane Dupont and Gueorgui Pironkov",
  title = "Blind Speech Separation and Enhancement With {GCC-NMF}",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "745--755",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2656805",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7828077/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Spille:2017:CBC,
  author = "Constantin Spille and Birger Kollmeier and Bernd T. Meyer",
  title = "Combining Binaural and Cortical Features for Robust Speech Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "756--767",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2661712",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7837638/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Koizumi:2017:IAF,
  author = "Yuma Koizumi and Kenta Niwa and Yusuke Hioka and Kazunori Kobayashi and Hitoshi Ohmuro",
  title = "Informative Acoustic Feature Selection to Maximize Mutual Information for Collecting Target Sources",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "768--779",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2662232",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon
Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7839197/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Higuchi:2017:OMB,
  author = "Takuya Higuchi and Nobutaka Ito and Shoko Araki and Takuya Yoshioka and Marc Delcroix and Tomohiro Nakatani",
  title = "Online {MVDR} Beamformer Based on Complex {Gaussian} Mixture Model With Spatial Prior for Noise Robust {ASR}",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "780--793",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2665341",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7845594/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Nakamura:2017:RTP,
  author = "Eita Nakamura and Kazuyoshi Yoshii and Shigeki Sagayama",
  title = "Rhythm Transcription of Polyphonic Piano Music Based on Merged-Output {HMM} for Multiple Voices",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "794--806",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2662479",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7839215/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp;
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ghahabi:2017:DLB,
  author = "Omid Ghahabi and Javier Hernando",
  title = "Deep Learning Backend for Single and Multisession {$i$}-Vector Speaker Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "807--817",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2661705",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7847321/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Karanasou:2017:VSN,
  author = "Penny Karanasou and Chunyang Wu and Mark Gales and Philip C. Woodland",
  title = "{$I$}-Vectors and Structured Neural Networks for Rapid Adaptation of Acoustic Models",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "818--828",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2670141",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7857716/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Aneeja:2017:EFF,
  author = "G. Aneeja and B.
Yegnanarayana",
  title = "Extraction of Fundamental Frequency From Degraded Speech Using Temporal Envelopes at High {SNR} Frequencies",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "829--838",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2666425",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7847347/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Sarfjoo:2017:UEN,
  author = "Seyyed Saeed Sarfjoo and Cenk Demiro{\u{g}}lu and Simon King",
  title = "Using Eigenvoices and Nearest-Neighbors in {HMM}-Based Cross-Lingual Speaker Adaptation With Limited Data",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "839--851",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2667880",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7851067/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Chen:2017:BNR,
  author = "Yung-Yue Chen and Jia-Hao Zhang",
  title = "Background Noise Reduction Design for Dual Microphone Cellular Phones: Robust Approach",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "852--862",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2572259",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7478101/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Yang:2017:IWR,
  author = "Liner Yang and Xinxiong Chen and Zhiyuan Liu and Maosong Sun",
  title = "Improving Word Representations with Document Labels",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "863--870",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2658019",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7833113/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhang:2017:NNS,
  author = "Shiliang Zhang and Cong Liu and Hui Jiang and Si Wei and Lirong Dai and Yu Hu",
  title = "Nonrecurrent Neural Structure for Long-Term Dependence",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "871--884",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2672398",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7859324/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Yang:2017:TIF,
  author = "Xuefeng Yang and Kezhi Mao",
  title = "Task Independent
Fine Tuning for Word Embeddings",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "885--894",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2644863",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7797241/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Bao:2017:DRB,
  author = "Yu Bao and Huawei Chen",
  title = "Design of Robust Broadband Beamformers Using Worst-Case Performance Optimization: a Semidefinite Programming Approach",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "895--907",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2674968",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7864329/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Cumani:2017:NVT,
  author = "Sandro Cumani and Pietro Laface",
  title = "Nonlinear {I}-Vector Transformations for {PLDA}-Based Speaker Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "908--919",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2674966",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7864395/",
  acknowledgement =
ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:IATb,
  author = "Anonymous",
  title = "{IEEE\slash} {ACM} Transactions on Audio, Speech, and Language Processing Edics",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "920--921",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2684712",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:ITA,
  author = "Anonymous",
  title = "{IEEE} Transactions on Audio, Speech, and Language Processing Information for Authors",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "922--923",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2684714",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:IICb,
  author = "Anonymous",
  title = "Introducing {IEEE Collabratec}",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "924",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2684717",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:FCb,
  author = "Anonymous",
  title = "Front Cover",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "C1",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2684721",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:ISPb,
  author = "Anonymous",
  title = "{IEEE Signal Processing Society}",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "C2",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2684723",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:ISPc,
  author = "Anonymous",
  title = "{IEEE Signal Processing Society}",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "C3",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2684725",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:BPa,
  author = "Anonymous",
  title = "Blank Page",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "4",
  pages = "C4",
  month = apr,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2684727",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Mon Jul 24 18:45:09 MDT 2017",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:TCi,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "925--926",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2684687",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:TCj,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "927--928",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2684689",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Airaksinen:2017:QPA,
  author = "Manu Airaksinen and Tom B{\"a}ckstr{\"o}m and Paavo Alku",
  title = "Quadratic Programming Approach to Glottal Inverse Filtering by Joint Norm-1 and Norm-2 Optimization",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "929--939",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2016.2620718",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7636994/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Schwartz:2017:MLB,
  author = "Ofer Schwartz and Sharon Gannot and Emanu{\"e}l A. P. Habets",
  title = "Multispeaker {LCMV} Beamformer and Postfilter for Source Separation and Noise Reduction",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "940--951",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2655258",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7842601/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2017:RHF,
  author = "Dongmei Wang and Chengzhu Yu and John H. L.
Hansen",
  title = "Robust Harmonic Features for Classification-Based Pitch Estimation",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "952--964",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2667879",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7851049/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Sainath:2017:MSP,
  author = "Tara N. Sainath and Ron J. Weiss and Kevin W. Wilson and Bo Li and Arun Narayanan and Ehsan Variani and Michiel Bacchiani and Izhak Shafran and Andrew Senior and Kean Chin and Ananya Misra and Chanwoo Kim",
  title = "Multichannel Signal Processing With Deep Neural Networks for Automatic Speech Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "965--979",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2672401",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7859320/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Khalilian:2017:SST,
  author = "Hanieh Khalilian and Ivan V. Baji{\'c} and Rodney G.
Vaughan",
  title = "A Simulation Study of a Three-Dimensional Sound Field Reproduction System for Immersive Communication",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "980--995",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2674971",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7864381/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Franck:2017:SOM,
  author = "Andreas Franck and Wenwu Wang and Filippo Maria Fazi",
  title = "Sparse {$ \ell_1$}-Optimal Multiloudspeaker Panning and Its Relation to Vector Base Amplitude Panning",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "996--1010",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2674975",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7864372/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Li:2017:SQS,
  author = "Songbin Li and Yizhen Jia and C.-C.
Jay Kuo",
  title = "Steganalysis of {QIM} Steganography in Low-Bit-Rate Speech Signals",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1011--1022",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2676356",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/cryptography2010.bib; https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7867798/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Kanda:2017:MPB,
  author = "Naoyuki Kanda and Xugang Lu and Hisashi Kawai",
  title = "Maximum-a-Posteriori-Based Decoding for End-to-End Acoustic Models",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1023--1034",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2678162",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7870575/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Shokouhi:2017:TKE,
  author = "Navid Shokouhi and John H. L.
Hansen",
  title = "{Teager--Kaiser} Energy Operators for Overlapped Speech Detection",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1035--1047",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2678684",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7872488/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Huang:2017:PSS,
  author = "Yi-Chin Huang and Chung-Hsien Wu and Yan-You Chen and Ming-Ge Shie and Jhing-Fa Wang",
  title = "Personalized Spontaneous Speech Synthesis Using a Small-Sized Unsegmented Semispontaneous Speech",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1048--1060",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2679603",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7874173/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Park:2017:ECD,
  author = "Jeongsoo Park and Jaeyoung Shin and Kyogu Lee",
  title = "Exploiting Continuity\slash Discontinuity of Basis Vectors in Spectrogram Decomposition for Harmonic-Percussive Sound Separation",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1061--1074",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2681742",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7876808/",
  acknowledgement =
ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhang:2017:DLB,
  author = "Xueliang Zhang and DeLiang Wang",
  title = "Deep Learning Based Binaural Speech Separation in Reverberant Environments",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1075--1084",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2687104",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7886357/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Delfarah:2017:FMB,
  author = "Masood Delfarah and DeLiang Wang",
  title = "Features for Masking-Based Monaural Speech Separation in Reverberant Conditions",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1085--1094",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2687829",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7887742/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Yang:2017:SCA,
  author = "Feiran Yang and Gerald Enzner and Jun Yang",
  title = "Statistical Convergence Analysis for Optimal Control of {DFT}-Domain Adaptive Echo Canceler",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1095--1106",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2671422",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7858641/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Nose:2017:SSB,
  author = "Takashi Nose and Yusuke Arao and Takao Kobayashi and Komei Sugiura and Yoshinori Shiga",
  title = "Sentence Selection Based on Extended Entropy Using Phonetic and Prosodic Contexts for Statistical Parametric Speech Synthesis",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1107--1116",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2688585",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7888524/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Firtha:2017:IRS,
  author = "Gergely Firtha and P{\'e}ter Fiala and Frank Schultz and Sascha Spors",
  title = "Improved Referencing Schemes for {2.5D} Wave Field Synthesis Driving Functions",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1117--1127",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2689245",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7888944/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Maestre:2017:JMB,
  author = "Esteban Maestre and Gary P. Scavone and Julius O.
Smith",
  title = "Joint Modeling of Bridge Admittance and Body Radiativity for Efficient Synthesis of String Instrument Sound by Digital Waveguides",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1128--1139",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2689241",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7888993/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Huang:2017:DFI,
  author = "Gongping Huang and Jacob Benesty and Jingdong Chen",
  title = "On the Design of Frequency-Invariant Beampatterns With Uniform Circular Microphone Arrays",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1140--1153",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2689681",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7890381/",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Prusa:2017:NMR,
  author = "Zden{\v{e}}k Pr{\r{u}}{\v{s}}a and Peter Balazs and Peter Lempel S{\o}ndergaard",
  title = "A Noniterative Method for Reconstruction of Phase From {STFT} Magnitude",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1154--1164",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2678166",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "http://ieeexplore.ieee.org/document/7890450/",
  acknowledgement =
ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:IATc,
  author = "Anonymous",
  title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1167--1168",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2705590",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:IATd,
  author = "Anonymous",
  title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} for authors",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1169--1170",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2705594",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:OAa,
  author = "Anonymous",
  title = "Open Access",
  journal = j-IEEE-ACM-TASLP,
  volume = "25",
  number = "5",
  pages = "1171",
  month = may,
  year = "2017",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2017.2707041",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Sat Jan 20 08:35:30 MST 2018",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:IICc,
  author = "Anonymous",
  title = "Introducing
{IEEE Collabratec}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "5", pages = "1172", month = may, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2707020", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:MGMa, author = "Anonymous", title = "{Member Get-A-Member (MGM) Program}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "5", pages = "1173", month = may, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2707024", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:BPb, author = "Anonymous", title = "Blank Page", journal = j-IEEE-ACM-TASLP, volume = "25", number = "5", pages = "B1165--B1166", month = may, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2707658", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:FCc, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "25", number = "5", pages = "C1", month = may, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2684719", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ISPd, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "5", pages = "C2", month = may, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2705586", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ISPe, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "5", pages = "C3", month = may, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2705598", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:BPc, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "25", number = "5", pages = "C4", month = may, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2705602", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:TCk, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1167--1168", month = jun, year = "2017", CODEN =
"????", DOI = "https://doi.org/10.1109/TASLP.2017.2684679", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Richard:2017:ISS, author = "G. Richard and T. Virtanen and J. P. Bello and N. Ono and H. Glotin", title = "Introduction to the Special Section on Sound Scene and Event Analysis", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1169--1171", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2699334", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sanchez-Hevia:2017:MLD, author = "H{\'e}ctor A. S{\'a}nchez-Hevia and David Ayll{\'o}n and Roberto Gil-Pita and Manuel Rosa-Zurera", title = "Maximum Likelihood Decision Fusion for Weapon Classification in Wireless Acoustic Sensor Networks", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1172--1182", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690579", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933058/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Koluguri:2017:SEU, author = "Nithin Rao Koluguri and G.
Nisha Meenakshi and Prasanta Kumar Ghosh", title = "Spectrogram Enhancement Using {Multiple Window Savitzky--Golay (MWSG)} Filter for Robust Bird Sound Detection", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1183--1192", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690562", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933047/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Stowell:2017:BSR, author = "Dan Stowell and Emmanouil Benetos and Lisa F. Gill", title = "On-Bird Sound Recordings: Automatic Acoustic Recognition of Activities and Contexts", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1193--1206", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690565", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933044/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Carroll:2017:OLA, author = "Brandon T. Carroll and Bradley M. Whitaker and Wayne Dayley and David V.
Anderson", title = "Outlier Learning via Augmented Frozen Dictionaries", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1207--1215", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690567", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933057/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bisot:2017:FLM, author = "Victor Bisot and Romain Serizel and Slim Essid and Ga{\"e}l Richard", title = "Feature Learning With Matrix Factorization Applied to Acoustic Scene Classification", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1216--1229", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690570", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933045/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2017:UFL, author = "Yong Xu and Qiang Huang and Wenwu Wang and Peter Foster and Siddharth Sigtia and Philip J. B. Jackson and Mark D.
Plumbley", title = "Unsupervised Feature Learning Based on Deep Models for Environmental Audio Tagging", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1230--1241", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690563", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933054/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Grzeszick:2017:BFM, author = "Ren{\'e} Grzeszick and Axel Plinge and Gernot A. Fink", title = "Bag-of-Features Methods for Acoustic Event Detection and Classification", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1242--1252", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690574", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933055/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rakotomamonjy:2017:SRL, author = "Alain Rakotomamonjy", title = "Supervised Representation Learning for Audio Scene Classification", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1253--1265", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690561", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933051/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp;
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Benetos:2017:PSE, author = "Emmanouil Benetos and Gr{\'e}goire Lafay and Mathieu Lagrange and Mark D. Plumbley", title = "Polyphonic Sound Event Tracking Using Linear Dynamical Systems", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1266--1277", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690576", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933041/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Phan:2017:IAS, author = "Huy Phan and Lars Hertel and Marco Maass and Philipp Koch and Radoslaw Mazur and Alfred Mertins", title = "Improved Audio Scene Classification Based on Label-Tree Embeddings and Convolutional Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1278--1290", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690564", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933052/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{r:2017:CRN, author = "Emre {\c{C}}ak{\i}r and Giambattista Parascandolo and Toni Heittola and Heikki Huttunen and Tuomas Virtanen", title = "Convolutional Recurrent Neural Networks for Polyphonic Sound Event Detection", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1291--1303", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690575", ISSN = "2329-9290", ISSN-L =
"2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933050/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schroder:2017:CAA, author = "Jens Schr{\"o}der and Niko Moritz and J{\"o}rn Anem{\"u}ller and Stefan Goetze and Birger Kollmeier", title = "Classifier Architectures for Acoustic Scenes and Events: Implications for {DNNs}, {TDNNs}, and Perceptual Features from {DCASE} 2016", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1304--1314", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690569", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933048/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2017:CTF, author = "Wenjun Yang and Sridhar Krishnan", title = "Combining Temporal Features by Local Binary Pattern for Acoustic Scene Classification", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1315--1321", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690558", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933046/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Dov:2017:MKM, author = "David Dov and Ronen Talmon and Israel Cohen", title = "Multimodal Kernel Method for Activity Detection of Sound Sources", journal =
j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1322--1334", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690568", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933049/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Imoto:2017:SCS, author = "Keisuke Imoto and Nobutaka Ono", title = "Spatial Cepstrum as a Spatial Feature Using a Distributed Microphone Array for Acoustic Scene Analysis", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1335--1343", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690559", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933053/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Trowitzsch:2017:RDE, author = "Ivo Trowitzsch and Johannes Mohr and Youssef Kashef and Klaus Obermayer", title = "Robust Detection of Environmental Sounds in Binaural Auditory Scenes", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1344--1356", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2690573", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7933059/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jameel:2017:NRF, author = "Abu Shafin
Mohammad Mahdee Jameel and Shaikh Anowarul Fattah and Rajib Goswami and Wei-Ping Zhu and M. Omair Ahmad", title = "Noise Robust Formant Frequency Estimation Method Based on Spectral Model of Repeated Autocorrelation of Speech", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1357--1370", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2016.2625423", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7736088/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2017:DDM, author = "Na Li and Man-Wai Mak and Jen-Tzung Chien", title = "{DNN}-Driven Mixture of {PLDA} for Robust Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1371--1383", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2692304", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7894162/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2017:SIB, author = "Kai Wu and Vaninirappuputhenpurayil Gopalan Reju and Andy W. H.
Khong and Shu Ting Goh", title = "Swarm Intelligence Based Particle Filter for Alternating Talker Localization and Tracking Using Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1384--1397", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2693566", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7898417/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:IATe, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1398--1399", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2705592", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:IATf, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} for authors", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1400--1401", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2705596", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:OAb, author = "Anonymous", title =
"Open Access", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1402", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2707022", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:IICd, author = "Anonymous", title = "Introducing {IEEE Collabratec}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1403", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2707039", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:MGMb, author = "Anonymous", title = "{Member Get-A-Member (MGM) Program}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "1404", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2707026", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:FCd, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "C1", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2706239", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource =
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ISPf, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "C2", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2705588", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ISPg, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "C3", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2705600", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:BPd, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "25", number = "6", pages = "C4", month = jun, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2705604", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:TCl, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7",
pages = "1405--1406", month = jul, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2717120", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:TCEa, author = "Anonymous", title = "Table of Contents Edics", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1407--1408", month = jul, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2717126", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2017:CTM, author = "Yu-An Chen and Ju-Chiang Wang and Yi-Hsuan Yang and Homer H.
Chen", title = "Component Tying for Mixture Model Adaptation in Personalization of Music Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1409--1420", month = jul, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2693565", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7898399/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zeinali:2017:HBP, author = "Hossein Zeinali and Hossein Sameti and Luk{\'a}{\v{s}} Burget", title = "{HMM}-Based Phrase-Independent $i$-Vector Extractor for Text-Dependent Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1421--1435", month = jul, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2694708", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7902120/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2017:TDF, author = "Xinzhou Xu and Jun Deng and Nicholas Cummins and Zixing Zhang and Chen Wu and Li Zhao and Bj{\"o}rn Schuller", title = "A Two-Dimensional Framework of Multiple Kernel Subspace Learning for Recognizing Emotion in Speech", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1436--1449", month = jul, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2694704", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL =
"http://ieeexplore.ieee.org/document/7902189/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Korpusik:2017:SLU, author = "Mandy Korpusik and James Glass", title = "Spoken Language Understanding for a Nutrition Dialogue System", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1450--1461", month = jul, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2694699", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7902155/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fakhry:2017:ASS, author = "Mahmoud Fakhry and Piergiorgio Svaizer and Maurizio Omologo", title = "Audio Source Separation in Reverberant Environments Using $ \beta $-Divergence-Based Nonnegative Factorization", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1462--1476", month = jul, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2695718", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7904611/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Laufer-Goldshtein:2017:SSS, author = "Bracha Laufer-Goldshtein and Ronen Talmon and Sharon Gannot", title = "Semi-Supervised Source Localization on Multiple Manifolds With Distributed Microphones", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1477--1491", month = jul, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2696310", ISSN =
"2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7906609/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Williamson:2017:TFM, author = "Donald S. Williamson and DeLiang Wang", title = "Time-Frequency Masking in the Complex Domain for Speech Dereverberation and Denoising", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1492--1501", month = jul, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2696307", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7906509/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lu:2017:SFH, author = "Liang Lu and Steve Renals", title = "Small-Footprint Highway Deep Neural Networks for Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1502--1511", month = jul, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2698723", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7913606/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kodrasi:2017:SDP, author = "Ina Kodrasi and Simon Doclo", title = "Signal-Dependent Penalty Functions for Robust Acoustic Multi-Channel Equalization", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1512--1525", month = jul, year = "2017", CODEN = "????",
DOI = "https://doi.org/10.1109/TASLP.2017.2699326", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7914695/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kim:2017:DIW, author = "Jung-Hee Kim and Jin Kim and Jae Hyeon Jeon and Sang Won Nam", title = "Delayless Individual-Weighting-Factors Sign Subband Adaptive Filter With Band-Dependent Variable Step-Sizes", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1526--1534", month = jul, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2699325", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7914653/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2017:GMD, author = "Yannan Wang and Jun Du and Li-Rong Dai and Chin-Hui Lee", title = "A Gender Mixture Detection Approach to Unsupervised Single-Channel Speech Separation Based on Deep Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1535--1546", month = jul, year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2700540", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7917323/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Vairetti:2017:SAP, author = "Giacomo Vairetti and Enzo {De Sena} and Michael Catrysse and S{\o}ren
Holdt Jensen and Marc Moonen and Toon van Waterschoot", title = "A Scalable Algorithm for Physically Motivated and Sparse Approximation of Room Impulse Responses With Orthonormal Basis Functions", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1547--1561", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2700940", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7918506/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:IATg, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1562--1563", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725100", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ITMb, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1564--1565", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725102", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:OAc, author = 
"Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1566", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725159", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:IICe, author = "Anonymous", title = "Introducing {IEEE Collabratec}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "1567", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725161", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:FCe, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "C1", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725679", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ISPh, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "C2", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725123", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ISPi, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "C3", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725109", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:BPe, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "25", number = "7", pages = "C4", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725111", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:30 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:TCm, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1562--1563", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725119", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:TCn, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = 
"1564--1565", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725121", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Stevens:2017:MSR, author = "Francis Stevens and Damian T. Murphy and Lauri Savioja and Vesa V{\"a}lim{\"a}ki", title = "Modeling Sparsely Reflecting Outdoor Acoustic Scenes Using the Waveguide {Web}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1566--1578", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2699424", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7918519/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Olivieri:2017:GPS, author = "Ferdinando Olivieri and Filippo Maria Fazi and Simone Fontana and Dylan Menzies and Philip Arthur Nelson", title = "Generation of Private Sound With a Circular Loudspeaker Array and the Weighted Pressure Matching Method", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1579--1591", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2700945", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7918631/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Elshamy:2017:IPS, author = "Samy Elshamy and Nilesh Madhu 
and Wouter Tirry and Tim Fingscheidt", title = "Instantaneous A Priori {SNR} Estimation by Cepstral Excitation Manipulation", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1592--1605", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2702385", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7922539/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Alku:2017:LPM, author = "Paavo Alku and Rahim Saeidi", title = "The Linear Predictive Modeling of Speech From Higher-Lag Autocorrelation Coefficients Applied to Noise-Robust Speaker Recognition", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1606--1617", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2703165", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7924356/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pang:2017:BSL, author = "Cheng Pang and Hong Liu and Jie Zhang and Xiaofei Li", title = "Binaural Sound Localization Based on Reverberation Weighting and Generalized Parametric Mapping", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1618--1632", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2703650", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7926345/", acknowledgement = ack-nhfb, 
journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pradhan:2017:IPD, author = "Somanath Pradhan and Vinal Patel and Dipen Somani and Nithin V. George", title = "An Improved Proportionate Delayless Multiband-Structured Subband Adaptive Feedback Canceller for Digital Hearing Aids", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1633--1643", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2705346", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7931717/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Drgas:2017:BNN, author = "Szymon Drgas and Tuomas Virtanen and J{\"o}rg L{\"u}cke and Antti Hurmalainen", title = "Binary Non-Negative Matrix Deconvolution for Audio Dictionary Learning", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1644--1656", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2709909", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7935444/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Saki:2017:RTU, author = "Fatemeh Saki and Nasser Kehtarnavaz", title = "Real-Time Unsupervised Classification of Environmental Noise Signals", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1657--1667", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2711059", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 
08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7937831/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kaushik:2017:ASD, author = "Lakshmish Kaushik and Abhijeet Sangwan and John H. L. Hansen", title = "Automatic Sentiment Detection in Naturalistic Audio", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1668--1679", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2678164", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7870612/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schwartz:2017:CRB, author = "Ofer Schwartz and Sharon Gannot and Emanu{\"e}l A. P. Habets", title = "{Cram{\'e}r--Rao} Bound Analysis of Reverberation Level Estimators for Dereverberation and Noise Reduction", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1680--1693", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2696308", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7906601/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Khademi:2017:IEB, author = "Seyran Khademi and Richard C. Hendriks and W. 
Bastiaan Kleijn", title = "Intelligibility Enhancement Based on Mutual Information", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1694--1708", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2714424", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7946152/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hatano:2017:CND, author = "Yuta Hatano and Chuang Shi and Yoshinobu Kajikawa", title = "Compensation for Nonlinear Distortion of the Frequency Modulation-Based Parametric Array Loudspeaker", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1709--1717", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2705280", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7930484/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chien:2017:EGI, author = "Yu-Ren Chien and Daryush D. Mehta and J{\'o}n Gu{\eth}nason and Mat{\'\i}as Za{\~n}artu and Thomas F. 
Quatieri", title = "Evaluation of Glottal Inverse Filtering Algorithms Using a Physiologically Based Articulatory Speech Synthesizer", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1718--1730", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2714839", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7946161/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:IATh, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1731--1732", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725719", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ITMc, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1733--1734", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725104", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:OAd, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, 
volume = "25", number = "8", pages = "1735", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725106", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:IICf, author = "Anonymous", title = "Introducing {IEEE Collabratec}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "1736", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725165", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:FCf, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "C1", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725681", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ISPj, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "C2", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725125", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL 
= "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ISPk, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "C3", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725167", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:BPf, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "25", number = "8", pages = "C4", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2725169", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:TCo, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1737--1738", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2743659", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:TCp, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1739--1740", month = "????", year = "2017", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2017.2743661", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Abesser:2017:ICM, author = "Jakob Abe{\ss}er and Gerald Schuller", title = "Instrument-Centered Music Transcription of Solo Bass Guitar Recordings", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1741--1750", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2702384", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7921692/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{LeCornu:2017:GIA, author = "Thomas {Le Cornu} and Ben Milner", title = "Generating Intelligible Audio Speech From Visual Speech", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1751--1761", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2716178", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7949073/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2017:TQE, author = "Lemao Liu and Atsushi Fujita and Masao Utiyama and Andrew Finch and Eiichiro Sumita", title = "Translation Quality Estimation Using Only Bilingual Corpora", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1762--1772", month = "????", year = "2017", CODEN = 
"????", DOI = "https://doi.org/10.1109/TASLP.2017.2716195", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7949019/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Grais:2017:TSS, author = "Emad M. Grais and Gerard Roma and Andrew J. R. Simpson and Mark D. Plumbley", title = "Two-Stage Single-Channel Audio Source Separation Using Deep Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1773--1783", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2716443", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7951020/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bernardi:2017:AFC, author = "Giuliano Bernardi and Toon van Waterschoot and Jan Wouters and Marc Moonen", title = "Adaptive Feedback Cancellation Using a Partitioned-Block Frequency-Domain {Kalman} Filter Approach With {PEM}-Based Signal Prewhitening", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1784--1798", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2716188", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7949026/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Patel:2017:MPS, author = "Vinal Patel and Jordan Cheer and Nithin 
V. George", title = "Modified Phase-Scheduled-Command {FxLMS} Algorithm for Active Sound Profiling", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1799--1808", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2717499", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7953648/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Janod:2017:DBF, author = "Killian Janod and Mohamed Morchid and Richard Dufour and Georges Linar{\`e}s and Renato {De Mori}", title = "Denoised Bottleneck Features From Deep Autoencoders for Telephone Conversation Analysis", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1809--1820", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2718843", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7954983/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Stefanakis:2017:PCS, author = "Nikolaos Stefanakis and Despoina Pavlidi and Athanasios Mouchtaris", title = "Perpendicular Cross-Spectra Fusion for Sound Source Localization With a Planar Microphone Array", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1821--1835", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2718733", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", note = "See corrections \cite{Stefanakis:2017:CPC}.", URL = 
"http://ieeexplore.ieee.org/document/7955064/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yoshimura:2017:SOM, author = "Takenori Yoshimura and Kei Hashimoto and Keiichiro Oura and Yoshihiko Nankaku and Keiichi Tokuda", title = "Simultaneous Optimization of Multiple Tree-Based Factor Analyzed {HMM} for Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1836--1845", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2721219", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7961246/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nakamura:2017:NVR, author = "Eita Nakamura and Kazuyoshi Yoshii and Simon Dixon", title = "Note Value Recognition for Piano Transcription Using {Markov} Random Fields", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1846--1858", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2722103", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7964741/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:IATi, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1859--1860", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2754183", ISSN 
= "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ITMd, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1861--1862", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2754185", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:OAe, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "1863", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2707043", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:FCg, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "25", number = "9", pages = "C1", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2754179", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:31 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
%%% Month values in the entries below are derived from the issue number:
%%% this journal's numbers track the calendar month (volume 22 number 1
%%% is jan), and Stefanakis:2017:CPC below refers to number 9 as
%%% ``Sep 17''.  Hence number 9 = sep, 10 = oct, 11 = nov, 12 = dec.

%%% Volume 25, number 9 (sep 2017): cover matter.

@Article{Anonymous:2017:ISPl,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "C2",
  month =        sep,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2754181",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:ISPm,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "C3",
  month =        sep,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2754187",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:BPg,
  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "9",
  pages =        "C4",
  month =        sep,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2754189",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:31 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 10 (oct 2017).

@Article{Anonymous:2017:TCq,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1859--1860",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2754203",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:TCr,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1861--1862",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2754205",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Tian:2017:EBA,
  author =       "Xiaohai Tian and Siu Wa Lee and Zhizheng Wu and Eng
                 Siong Chng and Haizhou Li",
  title =        "An Exemplar-Based Approach to Frequency Warping for
                 Voice Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1863--1876",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2723721",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/7968404/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2017:IME,
  author =       "Siying Wang and Sebastian Ewert and Simon Dixon",
  title =        "Identifying Missing and Extra Notes in Piano
                 Recordings Using Score-Informed Dictionary Learning",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1877--1889",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2724203",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/7971931/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Cumani:2017:JEP,
  author =       "Sandro Cumani and Pietro Laface",
  title =        "Joint Estimation of {PLDA} and Nonlinear
                 Transformations of Speaker Vectors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1890--1900",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2724198",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/7971950/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Kolbaek:2017:MSS,
  author =       "Morten Kolb{\ae}k and Dong Yu and Zheng-Hua Tan and
                 Jesper Jensen",
  title =        "Multitalker Speech Separation With Utterance-Level
                 Permutation Invariant Training of Deep Recurrent
                 Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1901--1913",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2726762",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/7979557/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Chung:2017:UID,
  author =       "Cheng-Tao Chung and Cheng-Yu Tsai and Chia-Hsiang Liu
                 and Lin-Shan Lee",
  title =        "Unsupervised Iterative Deep Learning of Speech
                 Features and Acoustic Tokens with Applications to
                 Spoken Term Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1914--1928",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2729024",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/7984872/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Antonello:2017:RIR,
  author =       "Niccol{\`o} Antonello and Enzo {De Sena} and Marc
                 Moonen and Patrick A. Naylor and Toon van Waterschoot",
  title =        "Room Impulse Response Interpolation Using a Sparse
                 Spatio-Temporal Representation of the Sound Field",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1929--1941",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2730284",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/7987742/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Qian:2017:DFE,
  author =       "Yanmin Qian and Nanxin Chen and Heinrich Dinkel and
                 Zhizheng Wu",
  title =        "Deep Feature Engineering for Noise Robust Spoofing
                 Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1942--1955",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2732162",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/7993036/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Hafezi:2017:AIV,
  author =       "Sina Hafezi and Alastair H. Moore and Patrick A.
                 Naylor",
  title =        "Augmented Intensity Vectors for Direction of Arrival
                 Estimation in the Spherical Harmonic Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1956--1968",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2736067",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8002621/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Jo:2017:SHS,
  author =       "Byeongho Jo and Jung-Woo Choi",
  title =        "Spherical Harmonic Smoothing for Localizing Coherent
                 Sound Sources",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1969--1984",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2738698",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8008781/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Jokinen:2017:IET,
  author =       "Emma Jokinen and Ulpu Remes and Paavo Alku",
  title =        "Intelligibility Enhancement of Telephone Speech Using
                 {Gaussian} Process Regression for Normal-to-Lombard
                 Spectral Tilt Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1985--1996",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2740004",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8010472/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Li:2017:MSL,
  author =       "Xiaofei Li and Laurent Girin and Radu Horaud and
                 Sharon Gannot",
  title =        "Multiple-Speaker Localization Based on Direct-Path
                 Features and Likelihood Maximization With Spatial
                 Sparsity Regularization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "1997--2012",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2740001",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8010441/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Arnela:2017:FES,
  author =       "Marc Arnela and Oriol Guasch",
  title =        "Finite Element Synthesis of Diphthongs Using Tuned
                 Two-Dimensional Vocal Tracts",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "2013--2023",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2735179",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8000370/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Baby:2017:JDD,
  author =       "Deepak Baby and Hugo {Van hamme}",
  title =        "Joint Denoising and Dereverberation Using
                 Exemplar-Based Sparse Representations and Decaying
                 Norm Constraint",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "2024--2035",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2744261",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8016372/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% EDICS is an acronym, so it is written in capitals and brace-protected
%%% against style-driven case changes.

@Article{Anonymous:2017:IATj,
  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} {EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "2036--2037",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2754207",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:ITMe,
  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "2038--2039",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2754209",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:OAf,
  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "2040",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2725163",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:FCh,
  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "C1",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2754199",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:ISPn,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "C2",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2754201",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:ISPo,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "C3",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2754211",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:BPh,
  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "10",
  pages =        "C4",
  month =        oct,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2754213",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 11 (nov 2017).

@Article{Anonymous:2017:TCs,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2041--2042",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2766999",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:TCt,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2043--2044",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2767001",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Huang:2017:TSD,
  author =       "Qinghua Huang and Lin Zhang and Yong Fang",
  title =        "Two-Stage Decoupled {DOA} Estimation Based on Real
                 Spherical Harmonics for Spherical Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2045--2058",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2737235",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8003459/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Hayashi:2017:DCL,
  author =       "Tomoki Hayashi and Shinji Watanabe and Tomoki Toda and
                 Takaaki Hori and Jonathan {Le Roux} and Kazuya Takeda",
  title =        "Duration-Controlled {LSTM} for Polyphonic Sound Event
                 Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2059--2070",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2740002",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8010445/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% The math in the next title is brace-protected, as is already done
%%% for the math in Hamilton:2017:FMD.

@Article{Pal:2017:SMU,
  author =       "Monisankha Pal and Goutam Saha",
  title =        "Spectral Mapping Using Prior Re-Estimation of
                 {$i$}-Vectors and System Fusion for Voice Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2071--2084",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2743620",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8015184/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Enarvi:2017:ASR,
  author =       "Seppo Enarvi and Peter Smit and Sami Virpioja and
                 Mikko Kurimo",
  title =        "Automatic Speech Recognition With Very Large
                 Conversational {Finnish} and {Estonian} Vocabularies",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2085--2097",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2743344",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8015196/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Muckenhirn:2017:LTS,
  author =       "Hannah Muckenhirn and Pavel Korshunov and Mathew
                 Magimai-Doss and S{\'e}bastien Marcel",
  title =        "Long-Term Spectral Statistics for Voice Presentation
                 Attack Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2098--2111",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2743340",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8015145/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Hamilton:2017:FMD,
  author =       "Brian Hamilton and Stefan Bilbao",
  title =        "{FDTD} Methods for {$3$-D} Room Acoustics Simulation
                 With High-Order Accuracy in Space and Time",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2112--2124",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2744799",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8016655/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Mowlaee:2017:NRM,
  author =       "Pejman Mowlaee and Martin Blass and W. Bastiaan
                 Kleijn",
  title =        "New Results in Modulation-Domain Single-Channel Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2125--2137",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2747082",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8022920/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Menzies:2017:DCC,
  author =       "Dylan Menzies and Filippo Maria Fazi",
  title =        "Decoding and Compression of Channel and Scene Objects
                 for Spatial Audio",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2138--2151",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2744264",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8016390/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Song:2017:ESE,
  author =       "Eunwoo Song and Frank K. Soong and Hong-Goo Kang",
  title =        "Effective Spectral and Excitation Modeling Techniques
                 for {LSTM--RNN}-Based Speech Synthesis Systems",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2152--2161",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2746264",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8017571/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Sharma:2017:DSR,
  author =       "Pulkit Sharma and Vinayak Abrol and Anil Kumar Sao",
  title =        "Deep-Sparse-Representation-Based Features for Speech
                 Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2162--2175",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2748240",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8023884/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Natgunanathan:2017:PBM,
  author =       "Iynkaran Natgunanathan and Yong Xiang and Guang Hua
                 and Gleb Beliakov and John Yearwood",
  title =        "Patchwork-Based Multilayer Audio Watermarking",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2176--2187",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2749001",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/cryptography2010.bib;
                 https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8025572/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Yu:2017:ALB,
  author =       "Chengzhu Yu and John H. L. Hansen",
  title =        "Active Learning Based Constrained Clustering For
                 Speaker Diarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2188--2198",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2747097",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8030331/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ottosen:2017:PVB,
  author =       "Emil Solsb{\ae}k Ottosen and Monika D{\"o}rfler",
  title =        "A Phase Vocoder Based on Nonstationary {Gabor}
                 Frames",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2199--2208",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2750767",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8031036/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Schwartz:2017:TMB,
  author =       "Boaz Schwartz and Sharon Gannot and Emanu{\"e}l A. P.
                 Habets",
  title =        "Two Model-Based {EM} Algorithms for Blind Source
                 Separation in Noisy Environments",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2209--2222",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2738438",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8007259/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Taseska:2017:NNP,
  author =       "Maja Taseska and Emanu{\"e}l A. P. Habets",
  title =        "Nonstationary Noise {PSD} Matrix Estimation for
                 Multichannel Blind Speech Extraction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2223--2236",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2750239",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8030098/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{DiGiorgi:2017:DDM,
  author =       "Bruno {Di Giorgi} and Simon Dixon and Massimiliano
                 Zanoni and Augusto Sarti",
  title =        "A Data-Driven Model of Tonal Chord Sequence
                 Complexity",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2237--2250",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2756443",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8049362/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Stefanakis:2017:CPC,
  author =       "N. Stefanakis and D. Pavlidi and A. Mouchtaris",
  title =        "Corrections to {``Perpendicular Cross-Spectra Fusion
                 for Sound Source Localization With a Planar Microphone
                 Array'' [Sep 17 1821--1835]}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2251",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2763038",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  note =         "See \cite{Stefanakis:2017:PCS}.",
  URL =          "http://ieeexplore.ieee.org/document/8082821/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:IATk,
  author =       "Anonymous",
  title =        "{{\booktitle{IEEE\slash ACM Transactions on Audio,
                 Speech, and Language Processing}}} {EDICS}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2252--2253",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2772589",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:ITMf,
  author =       "Anonymous",
  title =        "{{\booktitle{IEEE Transactions on Multimedia}}}
                 information for authors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2254--2255",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2772591",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:OAg,
  author =       "Anonymous",
  title =        "Open Access",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "2256",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2775939",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:FCi,
  author =       "Anonymous",
  title =        "Front Cover",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "C1",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2772581",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:ISPp,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "C2",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2772583",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:ISPq,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "C3",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2772593",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2017:BPi,
  author =       "Anonymous",
  title =        "Blank page",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "11",
  pages =        "C4",
  month =        nov,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2772595",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 25, number 12 (dec 2017).

@Article{Anonymous:2017:TCu,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2252--2253",
  month =        dec,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2772597",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Author names are spelled out in full to agree with the forms used
%%% for the same four people in Schultz:2017:BBS, so that name-based
%%% sorting and abbreviation treat both entries alike.

@Article{Schultz:2017:ISI,
  author =       "Tanja Schultz and Thomas Hueber and Dean J. Krusienski
                 and Jonathan S. Brumberg",
  title =        "Introduction to the Special Issue on Biosignal-Based
                 Spoken Communication",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2254--2256",
  month =        dec,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2768838",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Schultz:2017:BBS,
  author =       "Tanja Schultz and Michael Wand and Thomas Hueber and
                 Dean J. Krusienski and Christian Herff and Jonathan S.
                 Brumberg",
  title =        "Biosignal-Based Spoken Communication: a Survey",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "25",
  number =       "12",
  pages =        "2257--2271",
  month =        dec,
  year =         "2017",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2017.2752365",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Jan 20 08:35:32 MST 2018",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "http://ieeexplore.ieee.org/document/8114358/",
  acknowledgement = ack-nhfb,
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Dromey:2017:ELA, author = "Christopher Dromey and Katherine M. 
Black", title = "Effects of Laryngeal Activity on Articulation", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2272--2280", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2738564", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8114361/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Borsky:2017:MNV, author = "Michal Borsky and Daryush D. Mehta and Jarrad H. {Van Stan} and Jon Gudnason", title = "Modal and Nonmodal Voice Quality Classification Using Acoustic and Electroglottographic Features", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2281--2291", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2759002", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8114356/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sereshkeh:2017:ECC, author = "Alborz Rezazadeh Sereshkeh and Robert Trott and Aur{\'e}lien Bricout and Tom Chau", title = "{EEG} Classification of Covert Speech Using Regularized Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2292--2300", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2758164", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8114360/", acknowledgement = ack-nhfb, journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sahraeian:2017:CMS, author = "Reza Sahraeian and Dirk {Van Compernolle}", title = "Crosslingual and Multilingual Speech Recognition Based on the Speech Manifold", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2301--2312", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2751747", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8114354/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Grozdic:2017:WSR, author = "{\Dbar}or{\dbar}e T. Grozdi{\'c} and Slobodan T. Jovi{\v{c}}i{\'c}", title = "Whispered Speech Recognition Using Deep Denoising Autoencoder and Inverse Filtering", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2313--2322", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2738559", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8114355/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kim:2017:SIS, author = "Myungjong Kim and Beiming Cao and Ted Mau and Jun Wang", title = "Speaker-Independent Silent Speech Recognition From Flesh-Point Articulatory Movements Using an {LSTM} Neural Network", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2323--2336", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2758999", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 
MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8114350/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tobing:2017:ACS, author = "Patrick Lumban Tobing and Kazuhiro Kobayashi and Tomoki Toda", title = "Articulatory Controllable Speech Modification Based on Statistical Inversion and Production Mappings", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2337--2350", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2753583", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8114384/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Steiner:2017:STM, author = "Ingmar Steiner and S{\'e}bastien {Le Maguer} and Alexander Hewer", title = "Synthesis of Tongue Motion and Acoustics From Text Using a Multimodal Articulatory Database", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2351--2361", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2756818", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8114352/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gonzalez:2017:DSR, author = "Jose A. Gonzalez and Lam A. Cheah and Angel M. Gomez and Phil D. Green and James M. Gilbert and Stephen R. Ell and Roger K. 
Moore and Ed Holdsworth", title = "Direct Speech Reconstruction From Articulatory Sensor Data by Machine Learning", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2362--2374", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2757263", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8114382/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Janke:2017:ESD, author = "Matthias Janke and Lorenz Diener", title = "{EMG}-to-Speech: Direct Generation of Speech From Facial Electromyographic Signals", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2375--2385", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2738568", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8114359/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Meltzner:2017:SSR, author = "Geoffrey S. Meltzner and James T. Heaton and Yunbin Deng and Gianluca {De Luca} and Serge H. Roy and Joshua C. 
Kline", title = "Silent Speech Recognition as an Alternative Communication Device for Persons With Laryngectomy", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2386--2398", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2740000", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8114357/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2017:IMA, author = "Fei Chen and Lan Wang and Hui Chen and Gang Peng", title = "Investigations on {Mandarin} Aspiratory Animations Using an Airflow Model", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2399--2409", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2755400", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8114353/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xiong:2017:THP, author = "Wayne Xiong and Jasha Droppo and Xuedong Huang and Frank Seide and Michael L. 
Seltzer and Andreas Stolcke and Dong Yu and Geoffrey Zweig", title = "Toward Human Parity in Conversational Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2410--2423", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2756440", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8049322/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2017:CAR, author = "Biao Zhang and Deyi Xiong and Jinsong Su and Hong Duan", title = "A Context-Aware Recurrent Encoder for Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2424--2432", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2751420", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8031316/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Asaei:2017:PIL, author = "Afsaneh Asaei and Milos Cernak and Herv{\'e} Bourlard", title = "Perceptual Information Loss due to Impaired Speech Production", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2433--2443", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2738445", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8007273/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ma:2017:EDN, author = "Ning Ma and Tobias May and Guy J. Brown", title = "Exploiting Deep Neural Networks and Head Movements for Robust Binaural Localization of Multiple Sources in Reverberant Environments", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2444--2453", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2750760", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8086216/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:LR, author = "Anonymous", title = "List of Reviewers", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2454--2457", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2772658", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:IATl, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2458--2459", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2772604", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
@Article{Anonymous:2017:ITMg, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2460--2461", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2772606", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:OAh, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2462", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2775923", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:SII, author = "Anonymous", title = "2017 Subject Index {{\booktitle{IEEE Transactions on Applied Superconductivity}}} Vol. 
27", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "2463--2488", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2775900", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:FCj, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "C1", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2772600", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ISPr, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "C2", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2772602", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:ISPs, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "C3", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2772608", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2017:BPj, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "25", number = "12", pages = "C4", month = "????", year = "2017", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2772610", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:32 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCa, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "1--2", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2772585", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCEa, author = "Anonymous", title = "Table of Contents {[Edics]}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "3--4", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2772587", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yee:2018:NRP, author = "Dianna Yee and Homayoun Kamkar-Parsi and Rainer Martin and Henning Puder", title = "A Noise Reduction Postfilter for 
Binaurally Linked Single-Microphone Hearing Aids Utilizing a Nearby External Microphone", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "5--18", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2727684", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/7987050/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Backstrom:2018:FRD, author = "Tom B{\"a}ckstr{\o}m and Johannes Fischer", title = "Fast Randomization for Distributed Low-Bitrate Coding of Speech and Audio", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "19--30", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2757601", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8052578/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Deng:2018:SAS, author = "Jun Deng and Xinzhou Xu and Zixing Zhang and Sascha Fr{\"u}hholz and Bj{\"o}rn Schuller", title = "Semisupervised Autoencoders for Speech Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "31--43", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2759338", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8059872/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sahidullah:2018:RVL, author = "Md. Sahidullah and Dennis Alexander Lehmann Thomsen and Rosa Gonzalez Hautam{\"a}ki and Tomi Kinnunen and Zheng-Hua Tan and Robert Parts and Martti Pitk{\"a}nen", title = "Robust Voice Liveness Detection and Speaker Verification Using Throat Microphones", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "44--56", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2760243", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8060607/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Degottex:2018:LDP, author = "Gilles Degottex and Pierre Lanchantin and Mark Gales", title = "A Log Domain Pulse Model for Parametric Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "57--70", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2761546", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8063442/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Abel:2018:ASB, author = "Johannes Abel and Tim Fingscheidt", title = "Artificial Speech Bandwidth Extension Using Deep Neural Networks for Wideband Spectral Envelope Estimation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "71--83", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2761236", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 
08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8063328/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Saito:2018:SPS, author = "Yuki Saito and Shinnosuke Takamichi and Hiroshi Saruwatari", title = "Statistical Parametric Speech Synthesis Incorporating Generative Adversarial Networks", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "84--96", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2761547", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8063435/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Andersen:2018:RSD, author = "Kristian Timm Andersen and Marc Moonen", title = "Robust Speech-Distortion Weighted Interframe {Wiener} Filters for Single-Channel Noise Reduction", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "97--107", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2761699", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8063896/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chiang:2018:CDA, author = "Chen-Yu Chiang", title = "Cross-Dialect Adaptation Framework for Constructing Prosodic Models for {Chinese} Dialect Text-to-Speech Systems", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "108--121", month = "????", year = "2018", 
CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2762432", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8066318/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2018:COU, author = "Bingquan Liu and Zhen Xu and Chengjie Sun and Baoxun Wang and Xiaolong Wang and Derek F. Wong and Min Zhang", title = "Content-Oriented User Modeling for Personalized Response Ranking in Chatbots", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "122--133", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2763243", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8068225/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tang:2018:PTN, author = "Zhiyuan Tang and Dong Wang and Yixiang Chen and Lantian Li and Andrew Abel", title = "Phonetic Temporal Neural Model for Language Identification", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "134--144", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2764271", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8070977/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chakrabarty:2018:BAI, author = "Soumitro Chakrabarty and Emanu{\"e}l A. P. 
Habets", title = "A {Bayesian} Approach to Informed Spatial Filtering With Robustness Against {DOA} Estimation Errors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "145--160", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2752364", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8167179/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2018:IDF, author = "Kuan-Yu Chen and Shih-Hung Liu and Berlin Chen and Hsin-Min Wang", title = "An Information Distillation Framework for Extractive Summarization", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "161--170", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2764545", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8074745/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jin:2018:LST, author = "Ma Jin and Yan Song and Ian McLoughlin and Li-Rong Dai", title = "{LID}-Senones and Their Statistics for Language Identification", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "171--183", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2766023", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8080255/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2018:PJM, author = "Zhehuai Chen and Jasha Droppo and Jinyu Li and Wayne Xiong", title = "Progressive Joint Modeling in Unsupervised Single-Channel Overlapped Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "184--196", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2765834", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8080252/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ranjan:2018:CLB, author = "Shivesh Ranjan and John H. L. Hansen", title = "Curriculum Learning Based Approaches for Noise Robust Speaker Recognition", journal = j-IEEE-ACM-TASLP, volume = "26", number = "1", pages = "197--210", month = "????", year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2765832", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Jan 20 08:35:33 MST 2018", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "http://ieeexplore.ieee.org/document/8080267/", acknowledgement = ack-nhfb, journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bando:2018:SEB, author = "Yoshiaki Bando and Katsutoshi Itoyama and Masashi Konyo and Satoshi Tadokoro and Kazuhiro Nakadai and Kazuyoshi Yoshii and Tatsuya Kawahara and Hiroshi G. 
Okuno",
  title           = "Speech Enhancement Based on {Bayesian} Low-Rank and
                     Sparse Decomposition of Multichannel Magnitude
                     Spectrograms",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "215--230",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2772340",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8103886/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ruan:2018:SNE,
  author          = "Yu-Ping Ruan and Qian Chen and Zhen-Hua Ling",
  title           = "A Sequential Neural Encoder With Latent Structured
                     Description for Modeling Sentences",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "231--242",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2773198",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8106781/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Gully:2018:DSU,
  author          = "Amelia J. Gully and Helena Daffern and Damian T.
Murphy",
  title           = "Diphthong Synthesis Using the Dynamic {$3$D} Digital
                     Waveguide Mesh",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "243--255",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2774921",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8114217/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wu:2018:IIR,
  author          = "Chunyang Wu and Mark J. F. Gales and Anton Ragni and
                     Penny Karanasou and Khe Chai Sim",
  title           = "Improving Interpretability and Regularization in Deep
                     Learning",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "256--265",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2774919",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8114209/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Chen:2018:NAS,
  author          = "Kehai Chen and Tiejun Zhao and Muyun Yang and Lemao Liu
                     and Akihiro Tamura and Rui Wang and Masao Utiyama and
                     Eiichiro Sumita",
  title           = "A Neural Approach to Source Dependence Based Context
                     Model for Statistical Machine Translation",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "266--280",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2772846",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8105847/",
  acknowledgement
= ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Nikunen:2018:SMS,
  author          = "Joonas Nikunen and Aleksandr Diment and Tuomas Virtanen",
  title           = "Separation of Moving Sound Sources Using Multichannel
                     {NMF} and Acoustic Tracking",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "281--295",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2774925",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8114273/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Sward:2018:GFF,
  author          = "Johan Sw{\"a}rd and Hongbin Li and Andreas Jakobsson",
  title           = "Off-Grid Fundamental Frequency Estimation",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "296--303",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2775800",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8115315/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Menzies:2018:LFP,
  author          = "Dylan Menzies and Marcos F.
Sim{\'o}n G{\'a}lvez and Filippo Maria Fazi",
  title           = "A Low-Frequency Panning Method With Compensation for
                     Head Rotation",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "304--317",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2775860",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8115309/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Dropuljic:2018:VAA,
  author          = "Branimir Dropulji{\'c} and Igor Miji{\'c} and Davor
                     Petrinovi{\'c} and Tanja Jovanovic and Kre{\v{s}}imir
                     {\'C}osi{\'c}",
  title           = "Vocal Analysis of Acoustic Startle Responses",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "318--329",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2775742",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8115287/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Aichinger:2018:TMF,
  author          = "Philipp Aichinger and Martin Hagm{\"u}ller and Berit
                     Schneider-Stickler and Jean Schoentgen and Franz
                     Pernkopf",
  title           = "Tracking of Multiple Fundamental Frequencies in
                     Diplophonic Voices",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "330--341",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2761233",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             =
"http://ieeexplore.ieee.org/document/8062798/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Alexandridis:2018:MSS,
  author          = "Anastasios Alexandridis and Athanasios Mouchtaris",
  title           = "Multiple Sound Source Location Estimation in Wireless
                     Acoustic Sensor Networks Using {DOA} Estimates: The
                     Data-Association Problem",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "342--356",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2772831",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8105842/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Rehr:2018:ISG,
  author          = "Robert Rehr and Timo Gerkmann",
  title           = "On the Importance of Super-{Gaussian} Speech Priors for
                     Machine-Learning Based Speech Enhancement",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "357--366",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2778151",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8121999/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Djaziri-Larbi:2018:WDA,
  author          = "Sonia Djaziri-Larbi and Ga{\"e}l Mah{\'e} and Imen
                     Mezghani and Monia Turki and M{\'e}riem Ja{\"\i}dane",
  title           = "Watermark-Driven Acoustic Echo Cancellation",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "367--378",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             =
"https://doi.org/10.1109/TASLP.2017.2778150",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/cryptography2010.bib;
                     https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8122007/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Mesaros:2018:DCA,
  author          = "Annamaria Mesaros and Toni Heittola and Emmanouil
                     Benetos and Peter Foster and Mathieu Lagrange and Tuomas
                     Virtanen and Mark D. Plumbley",
  title           = "Detection and Classification of Acoustic Scenes and
                     Events: Outcome of the {DCASE 2016 Challenge}",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "379--393",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2778423",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8123864/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Chung:2018:UDS,
  author          = "Cheng-Tao Chung and Lin-Shan Lee",
  title           = "Unsupervised Discovery of Structured Acoustic Tokens
                     With Applications to Spoken Term Detection",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "394--405",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2778948",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8125178/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{May:2018:RSD,
  author          =
"Tobias May",
  title           = "Robust Speech Dereverberation With a Neural
                     Network-Based Post-Filter That Exploits
                     Multi-Conditional Training of Binaural Cues",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "406--414",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2765819",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8080254/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Mirbagheri:2018:RFA,
  author          = "Majid Mirbagheri and Les Atlas and Adrian K. C. Lee",
  title           = "Regression Factor Analysis With an Application to
                     Continuous {HRIR} Measurement",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "415--421",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2780989",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8169044/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Chien:2018:BNL,
  author          = "Jen-Tzung Chien",
  title           = "{Bayesian} Nonparametric Learning for Hierarchical and
                     Sparse Topics",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "422--435",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2779862",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8141927/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Stahl:2018:PSS,
  author          = "Johannes Stahl and Pejman Mowlaee",
  title           = "A Pitch-Synchronous Simultaneous Detection-Estimation
                     Framework for Speech Enhancement",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "2",
  pages           = "436--450",
  month           = feb,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2779405",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Jan 20 08:35:33 MST 2018",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL             = "http://ieeexplore.ieee.org/document/8125741/",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2018:FCa,
  author          = "Anonymous",
  title           = "Front Cover",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "C1--C1",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2018.2815927",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2018:ISPa,
  author          = "Anonymous",
  title           = "{IEEE Signal Processing Society}",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "C2--C2",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2018.2815929",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2018:TCb,
  author          = "Anonymous",
  title           = "Table of Contents",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "457--458",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2018.2809999",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2018:TCEb,
  author          = "Anonymous",
  title           = "Table of Contents [Edics]",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "459--460",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2018.2810001",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Salvador:2018:BMF,
  author          = "C. D. Salvador and S. Sakamoto and J. Trevi{\~n}o and Y.
Suzuki",
  title           = "Boundary Matching Filters for Spherical Microphone and
                     Loudspeaker Arrays",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "461--474",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2778562",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords        = "acoustic field; Acoustics; Array signal processing;
                     array signal processing; Boundary conditions; boundary
                     matching filters; Fourier transforms; Helmholtz
                     equations; high-definition spatial audio;
                     high-resolution arrays; integral equations; KHIE;
                     Kirchhoff Helmholtz integral equation;
                     Kirchhoff-Helmholtz integral equation; loudspeaker
                     array signals; loudspeaker arrays; Loudspeakers;
                     loudspeakers; matched filters; microphone array
                     signals; Microphone arrays; microphone arrays; open
                     reproduction boundary; physical boundary conditions;
                     rigid recording boundary; sound field reconstruction;
                     sound field recording; sound field reproduction; sound
                     fields; Spatial audio; spatial discretization effects;
                     spatial effects; spectral effects; spherical array;
                     spherical array signal conversion; spherical Fourier
                     transform; spherical harmonic functions; spherical
                     microphone; temporal effects; transform domain;
                     transform-domain signal conversion filters",
}

@Article{Abdelaziz:2018:CFM,
  author          = "A. H.
Abdelaziz",
  title           = "Comparing Fusion Models for {DNN}-Based Audiovisual
                     Continuous Speech Recognition",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "475--484",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2783545",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords        = "Acoustics; audio-visual systems; audiovisual automatic
                     speech recognition; audiovisual automatic speech
                     recognition (AV-ASR) benchmarks; audiovisual continuous
                     speech recognition; audiovisual fusion; audiovisual
                     fusion models; Audiovisual speech recognition;
                     automatic lipreading; clean-train-clean-test;
                     clean-train-noisy-test; coupled HMM; decision fusion
                     model; feature fusion model; hidden Markov models;
                     Hidden Markov models; Markov model; multistream hidden
                     Markov model (HMM); neural nets; Noise measurement;
                     noisy acoustic signals; novel LVCSR AV-ASR models;
                     phone recognition; Speech; speech recognition; Speech
                     recognition; turbo decoders; Visualization; vocabulary
                     continuous speech recognition models",
}

@Article{Emura:2018:RER,
  author          = "S.
Emura",
  title           = "Residual Echo Reduction for Multichannel Acoustic Echo
                     Cancelers With a Complex-Valued Residual Echo Estimate",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "485--500",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2782004",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords        = "acoustic signal processing; Acoustics; AEC; bias model;
                     Coherence; coherence estimation; complex-valued
                     residual echo estimate; conventional residual echo
                     reduction methods; echo reduction; echo suppression;
                     echo-path change; far-end signals; far-end talker
                     change; frequency responses; Frequency-domain analysis;
                     Loudspeakers; Microphones; Multichannel acoustic echo
                     canceler; multichannel acoustic echo cancelers;
                     residual echo; Speech; speech processing; Speech
                     processing; Wiener filters",
}

@Article{Do:2018:MLP,
  author          = "V. H. Do and N. F. Chen and B. P. Lim and M. A.
Hasegawa-Johnson",
  title           = "Multitask Learning for Phone Recognition of
                     Underresourced Languages Using Mismatched
                     Transcription",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "501--514",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2782360",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords        = "acoustic modeling; acoustic signal processing;
                     Acoustics; Adaptation models; annotation language; Data
                     models; Gaussian Mixture Model; Gaussian processes;
                     hidden Markov models; Hidden Markov models;
                     Hidden-Markov Model; learning (artificial
                     intelligence); matched target-language graphemes;
                     mismatched annotation-language graphemes; mismatched
                     transcription; multi-task learning; multitask learning
                     framework; natural language processing; neural nets;
                     Phone recognition; Probabilistic logic; probabilistic
                     transcription; Speech; speech audio; speech processing;
                     speech recognition; Speech recognition; under-resourced
                     languages; underresourced language",
}

@Article{Zohourian:2018:BSL,
  author          = "M. Zohourian and G. Enzner and R.
Martin",
  title           = "Binaural Speaker Localization Integrated Into an
                     Adaptive Beamformer for Hearing Aids",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "515--528",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2782491",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords        = "adaptive binaural beamformer; array signal processing;
                     Array signal processing; Azimuth; beamforming;
                     beamforming techniques; binaural hearing aids; binaural
                     localization; Binaural source localization; binaural
                     speaker localization; Cost function;
                     Direction-of-arrival estimation; direction-of-arrival
                     estimation; Estimation; feature extraction; hearing
                     aids; hearing-aids; interference suppression;
                     localization algorithms; maximum likelihood estimation;
                     Microphones; source separation; speaker recognition;
                     Speech; speech enhancement",
}

@Article{Xiang:2018:SSA,
  author          = "Y. Xiang and I. Natgunanathan and D. Peng and G. Hua and
                     B.
Liu",
  title           = "Spread Spectrum Audio Watermarking Using Multiple
                     Orthogonal {PN} Sequences and Variable Embedding
                     Strengths and Polarities",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "529--539",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2782487",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords        = "audio coding; audio data; audio signal; audio signal
                     processing; Audio watermarking; audio watermarking;
                     compression attacks; copyright; Copyright protection;
                     copyright protection; Discrete cosine transforms;
                     Electronic mail; embedding capacity; existing audio
                     watermarking methods; high robustness; Interference;
                     Multiple Orthogonal PN Sequences; noise addition;
                     Robustness; Speech; spread spectrum; spread spectrum
                     audio watermarking; SS-based audio watermarking method;
                     Variable Embedding Strengths; watermark bits;
                     Watermarking",
}

@Article{Tan:2018:CAA,
  author          = "C. Tan and F. Wei and Q. Zhou and N. Yang and B. Du and
                     W. Lv and M.
Zhou",
  title           = "Context-Aware Answer Sentence Selection With
                     Hierarchical Gated Recurrent Neural Networks",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "540--549",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2785283",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords        = "Analytical models; answer sentence selection;
                     artificial intelligence; candidate sentence;
                     comprehension style answer sentence selection; context
                     independent matching; context information; Context
                     modeling; context-aware answer sentence selection;
                     hierarchical gated recurrent neural networks;
                     hierarchical neural networks; Logic gates; natural
                     language processing; Question answering; question
                     answering (information retrieval); recurrent neural
                     nets; Recurrent neural networks; Semantics; sentence
                     level recurrent neural network; SQuAD datasets; WikiQA
                     datasets; word level recurrent neural network",
}

@Article{Zhang:2018:MSS,
  author          = "J. Zhang and S. P. Chepuri and R. C. Hendriks and R.
Heusdens",
  title           = "Microphone Subset Selection for {MVDR} Beamformer Based
                     Noise Reduction",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "550--563",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2786544",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords        = "array signal processing; candidate sensors;
                     computational complexity; convex optimization; convex
                     optimization techniques; convex programming;
                     correlation matrices; correlation methods; data-driven
                     approach; dynamic scenarios; Estimation; greedy
                     algorithm; greedy algorithms; greedy strategy;
                     informative sensors; matrix algebra; microphone subset
                     selection; Microphones; minimum variance distortionless
                     response beamformer based noise reduction; model-driven
                     scheme; MVDR; MVDR beamformer; Noise reduction; noise
                     reduction; output noise power; radius-based beamformer;
                     sensor measurements; Sensor selection; sensor selection
                     problem; Sensors; Signal to noise ratio;
                     signal-to-noise ratio; sparse MVDR; sparsity; Speech;
                     Speech processing; statistical analysis; statistical
                     information; transmission power; WASN; wireless
                     acoustic sensor networks; wireless sensor networks",
}

@Article{Wang:2018:SSWa,
  author          = "S. Wang and P. Lin and Y. Tsao and J. Hung and B.
Su",
  title           = "Suppression by Selecting Wavelets for Feature
                     Compression in Distributed Speech Recognition",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "564--579",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2779787",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords        = "back-end server; client terminal; compressed features;
                     compression rate; compression stage; data compression;
                     data processing; data transmission efficiency; device
                     requirements; Discrete wavelet transform; discrete
                     wavelet transform; discrete wavelet transforms;
                     Discrete wavelet transforms; distributed speech
                     recognition; down-sampling process; DSR; DWT; feature
                     compression; feature compression algorithm; feature
                     extraction; Feature extraction; feature sequence
                     temporal properties; Frequency modulation; high
                     frequency counterpart; incoming speech feature
                     sequence; incoming stream; low frequency subsequence;
                     low-frequency subsequence; Mandarin Chinese news
                     corpus; memory minimization; mobile device; network
                     server; noise-robustness techniques; oversmoothing
                     effects; recognition performance; recognition tasks;
                     remote network; Servers; specific feature statistics
                     normalization; Speech; Speech recognition; speech
                     recognition; SSW; SSW approach; standard robustness
                     task; statistics; statistics normalization; suppression
                     by selecting wavelets; temporal subsequences; wireless
                     channel; wireless channels",
}

@Article{Wang:2018:MBS,
  author          = "Y. Wang and M.
Brookes",
  title           = "Model-Based Speech Enhancement in the Modulation Domain",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "580--594",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2786863",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords        = "competitive algorithms; complex domain; Cost function;
                     estimated dynamics; Gaussring-model; Kalman filter;
                     Kalman filters; least mean squares methods; minimum
                     mean-square error (MMSE) estimator; MMSE estimation;
                     Modulation; modulation-domain Kalman filter;
                     modulation-domain speech enhancement; noise amplitudes;
                     Noise measurement; segmental SNR measure; short-time
                     objective intelligibility measure; spectral amplitudes;
                     Speech; speech amplitudes; Speech enhancement; speech
                     enhancement; speech intelligibility; speech quality
                     measure; speech recognition experiments; statistical
                     Gaussring model; statistical modelling",
}

@Article{Huemmer:2018:EPN,
  author          = "C. Huemmer and C. Hofmann and R. Maas and W.
Kellermann",
  title           = "Estimating Parameters of Nonlinear Systems Using the
                     Elitist Particle Filter Based on Evolutionary
                     Strategies",
  journal         = j-IEEE-ACM-TASLP,
  volume          = "26",
  number          = "3",
  pages           = "595--608",
  month           = mar,
  year            = "2018",
  CODEN           = "????",
  DOI             = "https://doi.org/10.1109/TASLP.2017.2788183",
  ISSN            = "2329-9290",
  ISSN-L          = "2329-9290",
  bibdate         = "Sat Aug 3 09:10:28 2019",
  bibsource       = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal        = "IEEE\slash ACM Transactions on Audio, Speech, and
                     Language Processing",
  journal-URL     = "https://dl.acm.org/loi/taslp;
                     http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords        = "acoustic distortion; approximated continuous posterior
                     distribution; Atmospheric measurements; Bayes methods;
                     classical particle filtering; elitist particle filter;
                     elitist particles; EPFES; Estimation; evolutionary
                     computation; evolutionary elitist-particle selection
                     scheme; evolutionary strategies; FIR filters; Gaussian
                     particle filter; instantaneously calculated particle
                     weights; latent state vector; linear FIR filter;
                     long-term information; loudspeakers; Loudspeakers;
                     nonlinear acoustic echo path; nonlinear acoustics;
                     nonlinear parameter estimation; nonlinear system;
                     Nonlinear systems; parameter estimation; particle
                     filter; particle filtering (numerical methods);
                     Particle measurements; Probability density function;
                     published elitist-particle selection process;
                     single-channel nonlinear acoustic echo cancellation;
                     State-space model; statistical distributions;
                     time-variant latent state; univariate nonstationary
                     growth model",
}

@Article{Salvati:2018:LCR,
  author          = "D. Salvati and C. Drioli and G. L.
Foresti", title = "A Low-Complexity Robust Beamforming Using Diagonal Unloading for Acoustic Source Localization", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "609--622", month = mar, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2789321", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic analysis; acoustic array processing; acoustic arrays; acoustic signal processing; acoustic source localization; Acoustics; array output vector; Array signal processing; array signal processing; broadband robust beamforming; Complexity theory; computational complexity; Covariance matrices; covariance matrices; data-dependent covariance matrix conditioning method; Diagonal unloading beamforming; diagonal unloading transformation method; direction of arrival estimation; DU beamformer localization performance; DU beamformer method; DU beamforming; eigenvalues and eigenfunctions; filtering theory; low-complexity robust beamforming; microphone array; Multiple signal classification; multiple signal classification method; noisy signal space; opportune diagonal matrix; radiating sound source; real acoustic data; response power beamforming; robust localization; robust minimum variance distortionless response filter; Robustness; Sensors; signal classification; signal subspace", } @Article{Su:2018:HSA, author = "J. Su and J. Zeng and D. Xiong and Y. Liu and M. Wang and J. 
Xie", title = "A Hierarchy-to-Sequence Attentional Neural Machine Translation Model", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "623--632", month = mar, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2789721", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "attention models; Chinese-English translation; clause level; Context modeling; conventional NMT model; Decoding; English-German translation; grammars; hierarchical neural network structure; Hierarchy-to-sequence; hierarchy-to-sequence attentional neural machine translation model; hierarchy-to-sequence attentional NMT model; language translation; learning (artificial intelligence); long parallel sentences; natural language processing; neural machine translation; neural nets; optimal model parameters; parameter learning; recurrent neural nets; Recurrent neural networks; recurrent neural networks; segmented clause sequence; segmented clauses; semantic compositionality modeling; Semantics; sequence-to-sequence attentional neural machine translation; short clauses; Speech; Speech processing; text analysis; Training; translation prediction", } @Article{Kheder:2018:UJM, author = "W. B. Kheder and D. Matrouf and M. Ajili and J. 
Bonastre", title = "A Unified Joint Model to Deal With Nuisance Variabilities in the $i$-Vector Space", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "633--645", month = mar, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2789399", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic corruptions; acoustic nuisances; acoustic signal processing; Acoustics; Additive noise; additive noise; baseline system performance; Computational modeling; corrupted test i-vector; data-driven nuisance compensation technique; i-vector; i-vector space; i-vectors framework; joint modeling; least mean squares methods; nuisance variabilities; Robustness; short utterance; speaker recognition; speaker recognition technology; Speaker verification; Speech; Speech processing; SR systems; Training; unified joint model; vectors", } @Article{Gelly:2018:ORB, author = "G. Gelly and J. 
Gauvain", title = "Optimization of {RNN}-Based Speech Activity Detection", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "646--656", month = mar, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2769220", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Artificial neural networks; automatic speech recognition systems; back-end parameters; CG-LSTM model; coordinated-gate LSTM network; downstream speech recognizer; Error analysis; feature extraction; frame error rate; long short-term memory; NIST 2015 SAD evaluation data; NIST detection cost function; nondifferentiable optimization problems; Optimization; particle swarm optimisation; particle swarm optimization; recurrent neural nets; recurrent neural network; Recurrent neural networks; recurrent neural networks; RNN models; SAD optimization; short-term memory network; Smoothing methods; Speech; Speech activity detection; speech activity detection; speech recognition; word error rate", } @Article{Taseska:2018:BSS, author = "M. Taseska and E. A. P. 
Habets", title = "Blind Source Separation of Moving Sources Using Sparsity-Based Source Detection and Tracking", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "657--670", month = mar, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2780993", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic source tracking; approximate Bayesian tracker; Bayes methods; blind source separation; blind source separation algorithms; BSS filters; estimated statistics; independent vector analysis-based BSS algorithms; measurement-to-source association probabilities; microphone arrays; Microphone arrays; Narrowband; noise reduction capabilities; optimal spatial filters; pattern clustering; Position measurement; probability; PSD matrix estimation; short time-frequency domain; source separation; source signals; Spatial filtering; spatial filters; spatially separated microphone arrays; Speech; Speech processing; TF bin associations; time-frequency bin", } @Article{Yu:2018:RWE, author = "L. Yu and J. Wang and K. R. Lai and X. 
Zhang", title = "Refining Word Embeddings Using Intensity Scores for Sentiment Analysis", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "671--681", month = mar, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2788182", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Context modeling; dissimilar intensity scores; fine-grained sentiment classification; labeled corpora; low-dimensional vector representations; natural language processing tasks; Neural networks; opposite sentiment polarity; pretrained word embeddings; pretrained word vectors; refinement process; Semantics; Sentiment analysis; sentiment analysis; sentiment embeddings; sentiment intensity scores; sentiment lexicons; sentimentally dissimilar words; Speech; Speech processing; sufficient sentiment information; word embeddings; word vector refinement; word vector refinement model; Word2vec", } @Article{Dorfan:2018:DEM, author = "Y. Dorfan and A. Plinge and G. Hazan and S. 
Gannot", title = "Distributed Expectation-Maximization Algorithm for Speaker Localization in Reverberant Environments", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "682--695", month = mar, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2788198", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustic measurements; acoustic radiators; acoustic source localization; active speakers; auditory scene analysis; complex-valued Gaussian mixture model; Direction-of-arrival estimation; distributed algorithms; distributed expectation-maximization; Estimation; expectation-maximisation algorithm; extreme conditions; filter the measurements; Gaussian processes; hearing; high localization accuracy; human hearing mechanisms; incremental expectation-maximization; Microphones; mixture models; modified incremental distributed expectation-maximization algorithm; multi-path; multipath conditions; multiple subbands; onset dominance; original IDEM framework; phase difference measurements; Precedence effect; real-valued truncated Gaussian mixture; reverberant environments; reverberation; Reverberation; sound source localization; speaker localization; spectral masking; Speech; speech processing; Speech processing; time difference of arrival; time difference of arrival measurements; time-of-arrival estimation; truncated Gaussian", } @Article{Anonymous:2018:IATa, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "696--697", month = mar, year = "2018", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2018.2815931", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ITMa, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "698--699", month = mar, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815933", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:OAa, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "700--700", month = mar, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2816479", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:IICa, author = "Anonymous", title = "Introducing {IEEE Collabratec}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "701--701", month = mar, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2816481", ISSN = 
"2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPb, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "C3--C3", month = mar, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815935", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:BPa, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "26", number = "3", pages = "C4--C4", month = mar, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815937", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:FCb, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "C1--C1", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815959", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPc, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "C2--C2", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815961", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCc, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "696--697", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815499", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCEc, author = "Anonymous", title = "Table of Contents [Edics]", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "698--699", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815501", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal 
= "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tan:2018:DBS, author = "Z. Tan and M. Mak and B. K. Mak", title = "{DNN}-Based Score Calibration With Multitask Learning for Noise Robust Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "700--712", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2791105", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "calibration; Calibration; calibration algorithms; conventional calibration methods; conventional score-shift approach; Deep learning; deep neural network; DNN approach; DNN-based score calibration; i-vector pairs; i-vector speaker verification systems; learning (artificial intelligence); multi-task learning; multitask DNNs; multitask learning; neural nets; Noise measurement; noise robust speaker verification; noise robustness; Noise robustness; score calibration; Signal to noise ratio; speaker ID; speaker recognition; speaker verification; Speech; Training; uncalibrated scores", } @Article{Hu:2018:ESF, author = "Y. Hu and Z. 
Ling", title = "Extracting Spectral Features Using Deep Autoencoders With Binary Distributed Hidden Units for Statistical Parametric Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "713--724", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2791804", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic modeling; Acoustics; BDAE training method; belief networks; binary distributed hidden units; DAE; Decoding; Deep auto-encoder; deep autoencoders; deep belief network; Feature extraction; feature extraction; feedforward deep neural networks; feedforward neural nets; Hidden Markov models; model training; Neural networks; parameter generation; raw features; spectral envelopes; spectral feature extraction method; Speech; speech synthesis; SPSS systems; statistical parametric speech synthesis; Training", } @Article{Laufer-Goldshtein:2018:HAS, author = "B. Laufer-Goldshtein and R. Talmon and S. 
Gannot", title = "A Hybrid Approach for Speaker Tracking Based on {TDOA} and Data-Driven Models", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "725--735", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2790707", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic channel variation; Acoustic measurements; acoustic signal processing; Acoustics; associated source position; associated TDOA readings; data modalities; data-driven propagation model; distributed microphone pairs; extended Kalman filter; extended Kalman filter (EKF); Gaussian process; Gaussian processes; high-dimensional acoustic feature representation; Kalman filters; learning-based approach; low-dimensional time difference of arrival estimation; Manifolds; Microphones; microphones; noisy enclosures; nonlinear filters; observation model; observation models; relative transfer function (RTF); reverberant acoustic channels; reverberant enclosures; reverberation; signal representation; Speaker tracking; speaker tracking schemes; Speech; speech processing; Speech processing; state-space representation; statistical analysis; statistical model; TDOA estimation; time difference of arrival (TDOA); time-of-arrival estimation; Training", } @Article{Cumani:2018:SRU, author = "S. Cumani and P. 
Laface", title = "Speaker Recognition Using e-Vectors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "736--748", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2791806", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "accurate speaker subspace; Adaptation models; e-vector subspace; e-vectors; e-vectors systems; eigenvoice; Estimation; i-vectors; i-vector systems; i-vector training; informative speaker subspace; intersession subspaces; JFA; joint factor analysis; low-dimensional subspace; speaker factors; speaker modeling approach; speaker recognition; Speaker recognition; speaker recognition evaluations; Speech; Speech processing; speech segment; Standards; text-independent speaker recognition; total variability i-vector subspace; Training; training segment; vectors", } @Article{Xu:2018:GVE, author = "L. Xu and K. A. Lee and H. Li and Z. 
Yang", title = "Generalizing {I}-Vector Estimation for Rapid Speaker Recognition", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "749--759", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2793670", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Baum-Welch statistics; compact representation; Computational modeling; Covariance matrices; covariance matrices; Estimation; factor representation; Gaussian processes; i-vector estimation; i-vector Gaussian formulation; Load modeling; Loading; NIST SRE 10; posterior covariance matrix; rapid computation; SOP approach; speaker recognition; Speaker verification; Speech; spoken utterance; Standards; subspace-orthogonalizing prior; text-independent speaker recognition; total variability model; vectors", } @Article{Buchris:2018:FDD, author = "Y. Buchris and I. Cohen and J. 
Benesty", title = "Frequency-Domain Design of Asymmetric Circular Differential Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "760--773", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2796844", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "array signal processing; asymmetric beampatterns; asymmetric circular differential microphone arrays; broadband beamforming; Circular differential microphone arrays; Frequency-domain analysis; frequency-domain analysis; frequency-domain design; Geometry; hypercardioid; microphone arrays; Microphone arrays; Multiaccess communication; Sensor arrays; supercardioid; superdirective beamformers", } @Article{Zhang:2018:ANC, author = "J. Zhang and T. D. Abhayapala and W. Zhang and P. N. Samarasinghe and S. 
Jiang", title = "Active Noise Control Over Space: A Wave Domain Approach", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "774--786", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2795756", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic potential energy reduction level; acoustic signal processing; active noise control; Active noise control (ANC); Adaptive algorithms; control region; fundamental problem; Harmonic analysis; loudspeaker weights; Loudspeakers; loudspeakers; Microphone arrays; minimisation; minimization problems; multichannel; Noise cancellation; noise cancellation performance; noise reduction level; Potential energy; primary noise field; reverberant room; secondary source driving signals; signal denoising; spatial noise; wave domain; wave domain approach; wave-domain active noise control algorithms; wave-domain adaptive algorithms; wave-domain residual signal coefficients; wave-domain secondary source coefficients", } @Article{Luo:2018:SIS, author = "Y. Luo and Z. Chen and N. 
Mesgarani", title = "Speaker-Independent Speech Separation With Deep Attractor Network", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "787--796", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2795749", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "attractor network; corresponding attractor point; deep attractor network; deep clustering; deep learning framework; deep learning methods; high-dimensional embedding space; learning (artificial intelligence); Machine learning; masker speakers; multi-talker; neural nets; Neural networks; output dimension problem; reference point; signal reconstruction; signal representation; Source separation; source separation; speaker mixtures; speaker-independent speech separation; Spectrogram; Speech; Speech processing; speech processing; speech recognition; standard signal reconstruction; Time-frequency analysis; time-frequency assignment; time-frequency embeddings; time-frequency representation", } @Article{Joy:2018:FSN, author = "N. M. Joy and S. R. Kothinti and S. 
Umesh", title = "{FMLLR} Speaker Normalization With {i-Vector}: In Pseudo-{FMLLR} and Distillation Framework", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "797--805", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2795754", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic modeling; acoustic signal processing; Acoustics; ASR task; augmenting i-vectors; automatic speech recognition system; decoding; deep neural networks; distillation; DNN acoustic model training; Feature extraction; feature-space maximum likelihood linear regression; FMLLR speaker normalization; generalized distillation framework; Hidden Markov models; i-vector; i-vector appended filterbank features; maximum likelihood estimation; neural nets; pseudo-FMLLR; pseudoFMLLR features; real-time scenario; regression analysis; single utterance; Speaker normalization; speaker normalizing methods; speaker recognition; speaker-specific FMLLR; Speech; Speech processing; Switchboard; time-synchronous pair; Training; Transforms; un-supervised; unsupervised speaker normalization techniques", } @Article{Chandna:2018:BAM, author = "S. Chandna and W. 
Wang", title = "Bootstrap Averaging for Model-Based Source Separation in Reverberant Conditions", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "806--819", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2797425", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Analytical models; audio signal processing; bootstrap averaging; expectation maximization (EM) algorithm; expectation maximization estimates; expectation-maximisation algorithm; frequency domain Gaussian mixture model; frequency-dependent GMM parameter estimates; frequency-domain analysis; Gaussian mixture model (GMM); Gaussian processes; mixture models; model-based source separation; parameter estimation; reverberant conditions; reverberant speech mixtures; Reverberation; reverberation; source separation; Source separation; spectral histogram; Speech; Speech processing; speech processing; statistical analysis; T-F masks; time-frequency (T-F) masking; Time-frequency analysis; time-frequency masks", } @Article{Tan:2018:DSV, author = "Z. Tan and M. Mak and B. K. Mak and Y. 
Zhu", title = "Denoised {Senone} {I}-Vectors for Robust Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "820--830", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2796843", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; backpropagation; backpropagation fine-tuning; belief networks; deep architecture; deep belief network; deep learning; denoised senone i-vectors; denoising autoencoder; denoising autoencoders; feature extraction; Feature extraction; i-vector extraction process; i-vectors; neural nets; Noise measurement; Noise reduction; noise robustness; noisy environments; phonetically discriminative acoustic features; phonetically discriminative features; Robustness; senone deep neural networks; senone posterior estimation; senone posteriors; signal denoising; speaker recognition; Speaker recognition; Speaker Verification; Speaker verification; Speech; Training", } @Article{Itakura:2018:BMA, author = "K. Itakura and Y. Bando and E. Nakamura and K. Itoyama and K. Yoshii and T. 
Kawahara", title = "{Bayesian} Multichannel Audio Source Separation Based on Integrated Source and Spatial Models", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "831--846", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2789320", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "audio signal processing; basis spectra weighted sum; Bayes methods; Bayesian models; Bayesian multichannel audio source separation; blind source separation; Computational modeling; Covariance matrices; factor-factor models; factor-mixture models; Gibbs sampling algorithms; hierarchical Bayesian models; Indexes; integrated source; latent Dirichlet allocation; latent source spectrograms; matrix decomposition; microphone array; microphone arrays; Mixture models; mixture-factor models; mixture-mixture models; Multichannel source separation; nonnegative matrix factorization; observed mixture spectrograms; source model; Source separation; source separation; source-spatial combinations; spatial factor model; spatial mixture model; spatial model; Spectrogram; statistical analysis; TF bin; time-frequency bin; unified models; unified source", } @Article{Anonymous:2018:IATb, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "847--848", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815963", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", 
acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ITMb, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "849--850", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815965", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:OAb, author = "Anonymous", title = "Open Access", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "851--851", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2816483", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:IICb, author = "Anonymous", title = "Introducing {IEEE Collabratec}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "852--852", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2816485", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM 
Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPd, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "C3--C3", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815967", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:BPb, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "26", number = "4", pages = "C4--C4", month = apr, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815969", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCd, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "853--854", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2830710", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCEd, author = "Anonymous", title = "Table of Contents [Edics]", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "855--856", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2830712", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Baba:2018:RGI, author = "Y. E. Baba and A. Walther and E. A. P. Habets", title = "{$3$D} Room Geometry Inference Based on Room Impulse Response Stacks", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "857--872", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2784298", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "3D room geometry inference; acoustic signal processing; acoustic wave reflection; architectural acoustics; direction-of-arrival estimation; echo labeling; Geometry; geometry; image microphones; Image model; Labeling; loudspeaker array geometry; loudspeakers; Loudspeakers; Microphone arrays; microphones; real image microphone positions; reflection point localization; reflection points; reflective boundaries; reflector localization; room geometry inference; room impulse response stacks; single microphone; Three-dimensional displays; TOA disambiguation; 
transient response; Two dimensional displays", } @Article{Zhang:2018:LDR, author = "Q. Zhang and J. H. L. Hansen", title = "Language\slash Dialect Recognition Based on Unsupervised Deep Learning", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "873--882", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2797420", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustics; additional transcribed speech information; adversarial autoencoder; Arabic dialect corpus; bottleneck feature; dialect recognition; estimated phonetic labels; feature extraction; Feature extraction; generative modeling autoencoder; Hidden Markov models; i-Vector framework; Language/Dialect recognition; latent variable learning algorithms; natural language processing; phonetic label estimation; Speech; speech coding; speech feature processing; speech processing; Speech processing; speech recognition; Speech recognition; state-of-the-art language/dialect; Training; unsupervised bottleneck feature extraction approach; unsupervised deep learning methods; unsupervised learning; variational autoencoder", } @Article{Ling:2018:WMG, author = "Z. Ling and Y. Ai and Y. Gu and L. 
Dai", title = "Waveform Modeling and Generation Using Hierarchical Recurrent Neural Networks for Speech Bandwidth Extension", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "883--894", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2798811", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "bottleneck features; BWE method models; conventional BWE methods; deep neural network; dilated convolutional neural network; dilated convolutional neural networks; feedforward neural nets; generated wideband speech; generation method; Hidden Markov models; hierarchical recurrent neural networks; hierarchical structure; high-frequency waveform sample; HRNN model; input narrowband waveform samples; LSTM layers; Narrowband; narrowband speech; plain sample-level recurrent neural network based method; reconstructed wideband speech; recurrent neural nets; Recurrent neural networks; recurrent neural networks; short-term memory layers; Speech; Speech bandwidth extension; speech bandwidth extension; speech coding; Speech processing; speech quality; speech synthesis; unconditional neural audio generator; vocoders; waveform modeling methods; Wideband; wideband frequency waveform sample; wideband speech waveforms", } @Article{Delcroix:2018:CAN, author = "M. Delcroix and K. Kinoshita and A. Ogawa and C. Huemmer and T. 
Nakatani", title = "Context Adaptive Neural Network Based Acoustic Models for Rapid Adaptation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "895--908", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2798821", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic context class; acoustic context information; acoustic model; acoustic model adaptation; Acoustic modeling; Acoustics; Adaptation models; adaptive training; auxiliary feature; auxiliary network; CHiME3 data; context adaptive neural network; context class weights; convolutional neural network; deep neural network; environmental adaptation; feedforward neural nets; Hidden Markov models; learning (artificial intelligence); network input; Neural networks; rapid adaptation; speaker adaptation experiments; Speech; speech recognition; speech recognition performance; Training; Training data", } @Article{Tran:2018:TMH, author = "L. T. T. Tran and S. E. Nordholm and H. Schepker and H. H. Dam and S. 
Doclo", title = "Two-Microphone Hearing Aids Using Prediction Error Method for Adaptive Feedback Control", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "909--923", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2798822", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "adaptive control; Adaptive feedback control; adaptive filter estimates; adaptive filters; added stable gain; AFC applications; AFC2; AFC2 method; Correlation; feedback; Feedback control; feedback path; feedback path estimation; handicapped aids; Hearing aids; hearing aids; loudspeaker signal; loudspeakers; Loudspeakers; microphone signals; Microphones; microphones; misalignment; optimal filters; PEM-AFC; PEM-AFC2; prediction error method; prefilter; relative transfer function; single-microphone single-loudspeaker systems; SMSL systems; Speech; Speech processing; speech processing; speech shaped noise; tracking rate; transfer functions; two-microphone adaptive feedback control method; two-microphone hearing aids; two-microphone single-loudspeaker hearing aid", } @Article{Chang:2018:PLM, author = "J. Chang and M. 
Marschall", title = "Periphony-Lattice Mixed-Order Ambisonic Scheme for Spherical Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "924--936", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2800290", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic field; acoustic signal processing; array signal processing; Array signal processing; Finite wordlength effects; Harmonic analysis; higher order ambisonics; Higher order ambisonics (HOA); HOA; horizontal performance; horizontal sound waves; horizontally incident sound waves; incident direction; Microphone arrays; microphone arrays; mixed-order ambisonics (MOA); MOA scheme; periphony-lattice mixed-order ambisonic scheme; signal reconstruction; sound field reconstruction; sound field reconstruction performance; Speech; Speech processing; spherical array layouts; spherical array of microphones; spherical beamforming; spherical harmonics coefficients; spherical harmonics expansion; spherical microphone arrays; theoretical truncation error", } @Article{Dionelis:2018:PAS, author = "N. Dionelis and M. 
Brookes", title = "Phase-Aware Single-Channel Speech Enhancement With Modulation-Domain {Kalman} Filtering", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "937--950", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2800525", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Correlation; enhanced speech phase spectrum; filtering theory; Fourier transforms; intelligibility metrics; Kalman filter prediction step; Kalman filter update step models; Kalman filters; modulation-domain Kalman filtering; Noise measurement; noise spectral log-amplitudes; nonlinear relations; phase-aware single-channel speech enhancement; phase-sensitive enhancement algorithm; Prediction algorithms; signal reconstruction; Spectral analysis; Speech; Speech enhancement; speech enhancement; speech enhancement algorithm; speech log-spectrum; speech phase; speech phase posterior; speech quality", } @Article{Zheng:2018:SAM, author = "C. Zheng and A. Deleforge and X. Li and W. 
Kellermann", title = "Statistical Analysis of the Multichannel {Wiener} Filter Using a Bivariate Normal Distribution for Sample Covariance Matrices", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "951--966", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2800283", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "bivariate normal distribution; Bivariate normal distribution; Correlation; covariance matrices; Covariance matrices; Gaussian distribution; intrinsic correlation coefficient; mean square error methods; minimum variance distortionless response beamformer; multichannel Wiener filter; MWF performance; Noise measurement; noise reduction; Noise reduction; noise sample covariance matrices; normal distribution; probability; probability density function; sample covariance matrix; Sensors; signal sampling; signal-to-noise-ratio; Speech; statistical analysis; Wiener filters", } @Article{Vaz:2018:ADU, author = "C. Vaz and V. Ramanarayanan and S. 
Narayanan", title = "Acoustic Denoising Using Dictionary Learning With Spectral and Temporal Regularization", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "967--980", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2800280", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic denoising; Algorithm design and analysis; CMF-WISA cost function; complex NMF; complex nonnegative matrix factorization; dictionary learning; Magnetic resonance imaging; magnetic resonance imaging scans; matrix decomposition; Noise measurement; noise modeling; Noise reduction; noise suppression; noisy spectrum; Real-time MRI; signal denoising; Spatial resolution; Speech; speech enhancement; speech+noise portions; Three-dimensional displays", } @Article{Wang:2018:PDB, author = "L. Wang and A. 
Cavallaro", title = "Pseudo-Determined Blind Source Separation for Ad-hoc Microphone Networks", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "981--994", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2803263", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; ad hoc networks; Ad hoc networks; Ad-hoc; ad-hoc microphone networks; asynchronous recording; blind source separation; Blind source separation; filtering theory; Frequency-domain analysis; ICA; incrementally source separation; independent component analysis; late-reverberation suppression; microphone arrays; Microphones; nontarget channels; over-determined mixture; overdetermined M $\times$ N mixture; power spectral density; pseudodetermined blind source separation; pseudodetermined mixture model; reference-based permutation alignment scheme; Reverberation; reverberation; sampling rate; signal sampling; sound sources; spectral postfilter; Speech; target channel; time offsets; wireless channels", } @Article{Cumani:2018:SHS, author = "S. Cumani and P. 
Laface", title = "Scoring Heterogeneous Speaker Vectors Using Nonlinear Transformations and Tied {PLDA} Models", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "995--1009", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2806305", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "class-dependent nonlinear transformation; e-vector; Estimation; Feature extraction; i-vector; NIST; NL-Tied-PLDA; non-linear density transformations; nonlinear tied-PLDA; PLDA; probabilistic linear discriminant analysis; probability; score heterogeneous i-vectors; scoring heterogeneous speaker vectors; speaker recognition; Speaker recognition; Speech; Speech processing; Speech recognition; test i-vectors; text-independent speaker recognition systems; Tied PLDA models; vectors", } @Article{Bernardi:2018:SOS, author = "G. Bernardi and T. {van Waterschoot} and J. Wouters and M. 
Moonen", title = "Subjective and Objective Sound-Quality Evaluation of Adaptive Feedback Cancellation Algorithms", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "1010--1024", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2808042", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic feedback; acoustic feedback control; Acoustics; Adaptive feedback cancellation (AFC); adaptive feedback cancellation algorithms; adaptive filters; AFC; application-specific objective measures; audio signal processing algorithms; block normalized least mean square algorithm; feedback; frequency-domain adaptive filter; frequency-domain adaptive filter (FDAF); frequency-domain analysis; Frequency-domain analysis; frequency-domain Kalman filter; Kalman filter; Kalman filters; least mean squares methods; Loudspeakers; music signals; objective sound-quality evaluation; PEM-FDKF; perceptual sound-quality evaluation; Prediction algorithms; prediction-error method; prediction-error method (PEM); Signal processing algorithms; Speech; Speech processing; speech processing; speech signals; statistical analysis; subjective sound-quality evaluation; subjective-evaluation measures", } @Article{Anonymous:2018:IATc, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "1025--1026", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2830714", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ITMc, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "1027--1028", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2830716", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:FCc, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "C1--C1", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2830706", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPe, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "C2--C2", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2830708", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPf, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "C3--C3", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2830738", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:BPc, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "26", number = "5", pages = "C4--C4", month = may, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2830740", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:FCd, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "C1--C1", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2833599", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM 
Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPg, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "C2--C2", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2833601", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCe, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1025--1026", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2833603", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCEe, author = "Anonymous", title = "Table of Contents [Edics]", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1027--1028", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2833605", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kameoka:2018:NMF, author = "H. Kameoka and T. Higuchi and M. Tanaka and L. Li", title = "Nonnegative Matrix Factorization With Basis Clustering Using Cepstral Distance Regularization", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1029--1040", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2795746", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; audio signal processing; audio source separation; Audio source separation; basis clustering; blind source separation; cepstral analysis; cepstral distance regularization; Clustering algorithms; joint optimization approach; Linear programming; magnitude spectrogram; majorization minimization algorithm; matrix decomposition; Mel frequency cepstral coefficient; mel-frequency cepstral coefficient (MFCC); mel-frequency cepstral coefficient domain; MFCC domain; music; musical instruments; NMF approach; nonnegative matrix factorization; nonnegative matrix factorization (NMF); optimisation; Optimization; polyphonic signal; Source separation; Spectrogram; time frame; time-varying amplitudes; underlying audio events; unsupervised instrument-wise source separation", } @Article{Donley:2018:MSR, author = "J. Donley and C. Ritz and W. B. 
Kleijn", title = "Multizone Soundfield Reproduction With Privacy- and Quality-Based Speech Masking Filters", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1041--1055", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2798804", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic contrast; Acoustics; confidential privacy; equal masking influence; frequency domain speech masker filter designs; Frequency-domain analysis; hearing; intelligibility; long term average speech spectra; Loudspeakers; loudspeakers; low-pass filters; multizone soundfield algorithms; Multizone soundfield reproduction; multizone soundfield reproduction; privacy; Privacy; quality; Silicon carbide; sound reproduction; soundfield reproduction geometry; spatial masking filters; speech; Speech; speech intelligibility; speech intelligibility contrast; speech masking filters; speech privacy; speech processing; Speech processing; speech quality mean opinion scores; target speech multizone reproduction", } @Article{Braun:2018:ECL, author = "S. Braun and A. Kuklasi{\'n}ski and O. Schwartz and O. Thiergart and E. A. P. Habets and S. Gannot and S. Doclo and J. 
Jensen", title = "Evaluation and Comparison of Late Reverberation Power Spectral Density Estimators", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1056--1071", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2804172", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "array processing; Dereverberation; diffuse sound; Electronic mail; late reverberation power spectral density estimators; late reverberation PSD estimators; Maximum likelihood estimation; Microphones; multichannel Wiener filter; power spectral density estimation; Reverberation; reverberation; reverberation reduction; Spatial coherence; spatio-spectral filters; spectral analysis; Speech; speech enhancement; Speech processing; Wiener filters", } @Article{Benaroya:2018:BLM, author = "E. L. Benaroya and N. Obin and M. Liuni and A. Roebel and W. Raumel and S. 
Argentieri", title = "Binaural Localization of Multiple Sound Sources by Non-Negative Tensor Factorization", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1072--1082", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2806745", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "audio signal processing; binaural head; binaural localization; Binaural localization; binaural sound source localization; blind source separation; computational audio scene analysis; Ear; Image analysis; matrix decomposition; multichannel audio signals; multiple sound sources; non-negative tensor factorization; nonnegative factorization; nonnegative tensor factorization; robot audition; Robot kinematics; sound source position; Speech; Speech processing; Tensile stress; tensors", } @Article{Perraudin:2018:ILA, author = "N. Perraudin and N. Holighaus and P. Majdak and P. 
Balazs", title = "Inpainting of Long Audio Segments With Similarity Graphs", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1083--1094", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2809864", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Audio imputation; audio inpainting; audio restoration; audio signal processing; audio signals; audio similarity graphs; candidate segment; concealment; concealment of data loss; distorted signal region; Distortion; extensive listening tests; graph theory; intuitive optimization scheme; long audio segments inpainting; long duration data loss compensation; lost content; lost signal region; Multiple signal classification; Music; music; music recovery; optimisation; real-world music signals; Redundancy; signal defects; signal structure; similarity graphs; Speech; Time-frequency analysis; time-persistent spectral similarity", } @Article{Magron:2018:MBS, author = "P. Magron and R. Badeau and B. 
David", title = "Model-Based {STFT} Phase Recovery for Audio Source Separation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1095--1105", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2811540", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Approximation algorithms; audio signal processing; audio source separation; auxiliary function method; complex-valued STFT; Fourier transforms; Frequency estimation; Harmonic analysis; iterative source separation procedure; Phase recovery; phase unwrapping; short-time Fourier transform; sinusoidal modeling; source separation; Source separation; Speech; Speech processing; STFT phase increment; STFT phase recovery; time-domain analysis; time-domain signals; Time-frequency analysis; Wiener filters; Wiener-like filtering", } @Article{Kodrasi:2018:AED, author = "I. Kodrasi and S. 
Doclo", title = "Analysis of Eigenvalue Decomposition-Based Late Reverberation Power Spectral Density Estimation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1106--1118", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2811184", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "computational complexity; Dereverberation; eigenvalue decomposition; eigenvalues and eigenfunctions; Estimation error; estimation errors; EVD; EVD-based PSD estimator; filtering theory; late reverberation power spectral density estimation; late reverberation PSD estimator; maximum likelihood based PSD estimator; maximum likelihood estimation; Microphones; ML; ML based PSD estimator; modeling errors; multichannel methods; multichannel Wiener filter; Noise measurement; prewhitening; PSD estimate; PSD estimation; relative transfer functions; reverberant speech PSD matrix; reverberation; Reverberation; Spatial coherence; spatial coherence matrix; spectral analysis; Speech; speech dereverberation techniques; speech processing; transfer functions; Wiener filters", } @Article{Braun:2018:LPB, author = "S. Braun and E. A. P.
Habets", title = "Linear Prediction-Based Online Dereverberation and Noise Reduction Using Alternating {Kalman} Filters", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1119--1129", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2811247", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; alternating Kalman filters; alternating minimization; autoregressive model; autoregressive processes; causality problem; Dereverberation; Estimation; Fourier transforms; Kalman filter; Kalman filters; MAR coefficients; Microphones; multichannel autoregressive coefficients; multichannel linear prediction; Noise reduction; noise-free reverberant signals; online dereverberation; online processing; optimal noise reduction; Reverberation; reverberation; reverberation reduction; sequential enhancement structures; short-time Fourier transform; signal model; Speech; speech enhancement; Speech processing; STFT domain; time-variant acoustic scenarios; transient response", } @Article{Ram:2018:SSM, author = "D. Ram and A. Asaei and H. 
Bourlard", title = "Sparse Subspace Modeling for Query by Example Spoken Term Detection", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1130--1143", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815780", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "AMI database; deep neural network; Dictionaries; dynamic programming; dynamic programming framework; feature extraction; Feature extraction; low-dimensional subspaces; MediaEval database; Mel frequency cepstral coefficient; Neural networks; phone posterior features; posterior probabilities; QbE-STD systems; query by example; query by example spoken term detection; query examples; query processing; query subspace; sparse coding; sparse model recovery; sparse reconstruction errors; sparse recovery modeling; sparse representation; sparse structure; sparse subspace modeling; Speech; Speech processing; speech processing; spoken query; spoken term detection; standard template matching; subspace detection; subspace regularization; Task analysis; template matching likelihood; template matching techniques; temporal structure; zero-resource scenario", } @Article{Krawczyk-Becker:2018:SEU, author = "M. Krawczyk-Becker and T. 
Gerkmann", title = "On Speech Enhancement Under {PSD} Uncertainty", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1144--1153", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2816241", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "available speech PSD estimates; Bayes methods; Bayesian clean speech estimators; derived statistical framework; Malah's amplitude estimators; Maximum likelihood estimation; modern PSD estimators; musical noise; Noise measurement; Noise reduction; novel nonlinear clean speech estimator; power spectral densities; power spectral density; PSD estimation errors; PSD uncertainty; robust speech enhancement performance; spectral analysis; Speech; Speech enhancement; speech enhancement; speech estimation errors; statistical analysis; typical speech PSDs; Uncertainty; uncertainty; well-known conventional clean speech estimators", } @Article{Leglaive:2018:SSM, author = "S. Leglaive and R. Badeau and G. 
Richard", title = "{Student}'s $t$-Source and Mixing Models for Multichannel Audio Source Separation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1154--1168", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2813011", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "audio signal processing; Audio source separation; Bayes methods; Bayesian framework; blind source separation; convolution; convolutive mixing process; filtering theory; matrix decomposition; mixing filters; multichannel audio source separation; multichannel reverberant mixtures; Music; musical signals; non-negative matrix factorization; nonnegative matrix factorization model; Probabilistic logic; Random variables; simple characteristic structure; simple probabilistic priors; source separation; Source separation; specific structure; statistical distributions; statistical room acoustics; student t distribution; student t source and mixing models; Student's t distribution; Time-domain analysis; Time-frequency analysis; time-frequency analysis; time-frequency domain; transient response; under-determined audio source separation; variational inference", } @Article{Anonymous:2018:IATd, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1169--1170", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2833607", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ITMd, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "1171--1172", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2833609", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPh, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "C3--C3", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2833611", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:BPd, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "26", number = "6", pages = "C4--C4", month = jun, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2833613", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:FCe, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "C1--C1", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855859", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPi, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "C2--C2", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855861", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCf, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1173--1174", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2834199", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash 
ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCEf, author = "Anonymous", title = "Table of Contents [Edics]", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1175--1176", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2834201", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yoshimura:2018:MCB, author = "T. Yoshimura and K. Hashimoto and K. Oura and Y. Nankaku and K. Tokuda", title = "Mel-Cepstrum-Based Quantization Noise Shaping Applied to Neural-Network-Based Speech Waveform Synthesis", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1177--1184", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2818408", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "approximation theory; cepstral analysis; Feature extraction; filtering theory; human auditory perception; mel-cepstral coefficients; mel-cepstrum; mel-cepstrum-based quantization noise shaping method; mel-log spectrum approximation filter; neural nets; neural-network-based speech waveform synthesis system; noise shaping; Noise shaping; quantisation (signal); quantization; Quantization (signal); 
Speech; Speech processing; speech quality; speech synthesis; Speech waveform synthesis; synthetic speech; Vocoders; WaveNet; WaveNet generative model; white noise; White noise", } @Article{Wang:2018:MLE, author = "Q. Wang and J. Du and L. Dai and C. Lee", title = "A Multiobjective Learning and Ensembling Approach to High-Performance Speech Enhancement With Compact Neural Network Architectures", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1185--1197", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2817798", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "7-frame input expansion; cepstral analysis; clean GFCC; clean LPS; clean MFCC; clean speech feature; compact and low-latency design; compact DNNs; compact neural network architectures; deep neural network (DNN); deep neural network architecture; dynamic noise feature; ensembling approach; estimated clean features; feature extraction; Gaussian processes; hidden Markov models; high-performance speech enhancement; IRM; learned features; learning (artificial intelligence); log-power spectra; low-latency design; Mel frequency cepstral coefficient; MOE-DNN; MOL-DNN; MOLE approach; multiobjective ensembling; multiobjective ensembling DNN; multiobjective learning; multiobjective learning DNN; multiobjective set; multiple features; neural net architecture; Neural networks; Noise measurement; regression analysis; SE system; Speech; Speech enhancement; speech enhancement; Speech enhancement (SE); weak models; weak regression functions", } @Article{Del-Agua:2018:SAC, author = "M. {\'A}. Del-Agua and A. Gim{\'e}nez and A.
Sanchis and J. Civera and A. Juan", title = "Speaker-Adapted Confidence Measures for {ASR} Using Deep Bidirectional Recurrent Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1198--1206", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2819900", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Adaptation models; ASR; automatic speech recognition; Automatic speech recognition; Computer architecture; confidence estimation; confidence measures; DBLSTM; DBRNN; deep bidirectional recurrent neural networks; English LibriSpeech; long short-term memory; long short-term memory cells; natural language processing; nonadapted confidence measures; recurrent neural nets; Recurrent neural networks; recurrent neural networks-based confidence classifiers; RNN; Spanish PoliMedia tasks; speaker adaptation; speaker-adapted confidence measures; Speech; speech corpus; Speech processing; speech recognition; Task analysis; TED-LIUM corpus; Training; unsupervised adaptation method", } @Article{Proenca:2018:MDC, author = "J. Proen{\c{c}}a and C. Lopes and M. Tjalve and A. Stolcke and S. Candeias and F. 
Perdig{\~a}o", title = "Mispronunciation Detection in Children's Reading of Sentences", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1207--1219", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2820429", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "automatic assessment; automatic reading annotation; automatic reading tutors; automatic segmentation; candidate segmentation; candidate word pronunciations; children sentence reading; children's reading; correct pronunciation; Decoding; Electronic mail; feature extraction; Grammar; Hidden Markov models; log-likelihood ratio; manual segmentation; Measurement; mispronunciation classification; mispronunciation detection; natural language processing; phoneme recognition approaches; segmentation stage; Speech; Speech analysis; spotting approach; Task analysis; word candidates; word pronunciation; word spotting model", } @Article{Stankovic:2018:ARS, author = "Ljubi{\v{s}}a Stankovi{\'c} and Milo{\v{s}} Brajovi{\'c}", title = "Analysis of the Reconstruction of Sparse Signals in the {DCT} Domain Applied to Audio Signals", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1220--1235", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2819819", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "approximately sparse signals; audio signal processing; Audio signals; compressed sensing; compressive sensing methods; computationally efficient reconstruction algorithm; DCT coefficients; DCT domain; digital signal processing; discrete cosine transform; discrete cosine transforms; Discrete cosine transforms; Discrete Fourier transforms; disturbance scenarios; experimental signals; mean square error methods; mean-square reconstruction error; nonsparse noisy signals; recorded audio signals; reduced set; signal reconstruction; signal representation; signal samples; signal sampling; sparse audio signal processing; sparse signal processing; Speech; Speech processing; statistical properties; synthetic signals; unique reconstruction conditions", } @Article{Santos:2018:SDC, author = "J. F. Santos and T. H. Falk", title = "Speech Dereverberation With Context-Aware Recurrent Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1236--1246", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2821899", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "architectural acoustics; context information; Context modeling; context-aware recurrent neural networks; Convolution; convolutional codes; convolutional encoder; deep learning; Dereverberation; Feature extraction; feature extraction; high reverberation times; long-term dependencies; long-term information; perceived reverberation; perceptual evaluation; perceptual objective listening quality assessment; recurrent neural nets; recurrent neural network; recurrent 
neural networks; reverberant counterpart; reverberant speech; Reverberation; reverberation; reverberation time; short-time objective intelligibility; simulated room impulse responses; spectral magnitude; Speech; speech coding; speech dereverberation; speech enhancement; Speech enhancement; speech intelligibility; speech quality; Time-frequency analysis", } @Article{Geronazzo:2018:DWN, author = "M. Geronazzo and S. Spagnol and F. Avanzini", title = "Do We Need Individual Head-Related Transfer Functions for Vertical Localization? The Case Study of a Spectral Notch Distance Metric", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1247--1260", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2821846", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustics; anthropometry; audio signal processing; auditory elevation perception; auditory model; auditory models; Computational modeling; Databases; dummy-head HRTF; head-related transfer function rendering process; head-related transfer functions (HRTFs); hearing; HRTF selection; HRTF spectra; image processing; individual head-related transfer functions; individualized HRTFs; nonindividual HRTF set; personalized HRTF set; Psychoacoustic models; psychoacoustically motivated anthropometry based mismatch function; random HRTF selection; rendering (computer graphics); Spatial audio; spectral notch distance; spectral notch metric; Speech; Speech processing; transfer functions; Transfer functions; vertical localization", } @Article{Marquardt:2018:ICP, author = "D. Marquardt and S. 
Doclo", title = "Interaural Coherence Preservation for Binaural Noise Reduction Using Partial Noise Estimation and Spectral Postfiltering", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1261--1274", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2823081", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "array signal processing; Auditory system; beamforming; binaural cues; binaural multichannel Wiener filter; binaural MVDR beamformer; binaural MWF; binaural noise reduction; binaural speech enhancement algorithms; closed-form expression; Coherence; computational complexity; diffuse noise scenarios; Distortion; estimation theory; hearing aids; Integrated circuits; interaural coherence; interaural coherence preservation; Microphones; minimum-variance-distortionless response; Multi-channel Wiener filter; MVDR-IC; MVDR-N; MWF-IC; MWF-N; noise reduction; Noise reduction; noise reduction performance; partial noise estimation; quasidistortionless version; signal denoising; single desired speech source; spectral postfilter; Speech; speech enhancement; undesired noise component; Wiener filters", } @Article{Farmani:2018:BCI, author = "M. Farmani and M. S. Pedersen and Z. Tan and J. 
Jensen", title = "Bias-Compensated Informed Sound Source Localization Using Relative Transfer Functions", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1275--1289", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2825110", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; ambient noise characteristics; bias-compensated informed sound source localization; binaural configurations; binaural microphone array configurations; computational complexity; Databases; direction of arrival estimation; direction-of-arrival estimation; Direction-of-arrival estimation; DoA estimator; DoA-dependent relative transfer functions; HA microphones; hearing aid; hearing aid system; hearing aids; Hearing aids; information fusion strategy; lower computational complexity; maximum likelihood; Maximum likelihood estimation; maximum likelihood estimation; maximum-likelihood approach; microphone arrays; microphone signals; Microphones; monaural microphone array configurations; noise-free target speech; received signals; relative transfer function; reverberation; sensor fusion; shadowing effect; Sound source localization; Speech; target sound direction; transfer functions; Wireless communication; wireless microphone informs the HA system", } @Article{Tao:2018:GNN, author = "F. Tao and C. 
Busso", title = "Gating Neural Network for Large Vocabulary Audiovisual Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1290--1302", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2815268", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "audio-visual systems; audiovisual automatic speech recognition; audiovisual CRSS-4ENGLISH-14 corpus; Audiovisual large vocabulary automatic speech recognition; audiovisual perception process; AV-ASR; complementary information; deep learning solution; Feature extraction; gating layer; gating neural network; Gaussian processes; hidden Markov models; Hidden Markov models; human interactions; hybrid system; learning (artificial intelligence); Machine learning; Multimodal deep learning; multistream HMM system; neural nets; Noise measurement; noisy conditions; noisy features; observation models; real-world applications; Speech; speech recognition; Speech recognition; uninformative visual features; visual cues; Visualization; vocabulary; vocabulary audiovisual speech recognition", } @Article{Anonymous:2018:IATe, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1303--1304", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855863", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM
Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ITMe, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "1305--1306", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855865", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPj, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "C3--C3", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855867", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:BPe, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "26", number = "7", pages = "C4--C4", month = jul, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855869", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", 
journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:FCf, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "C1--C1", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855871", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPk, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "C2--C2", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855873", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCg, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1303--1304", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2834279", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", 
} @Article{Anonymous:2018:TCEg, author = "Anonymous", title = "Table of Contents [Edics]", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1305--1306", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2834281", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rafii:2018:OLA, author = "Z. Rafii and A. Liutkus and F. St{\"o}ter and S. I. Mimilakis and D. FitzGerald and B. Pardo", title = "An Overview of Lead and Accompaniment Separation in Music", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1307--1335", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2825440", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "accompaniment; accompaniment separation; audio signal processing; automatic karaoke; data-centered approaches; deep learning; Lead; lead; lead component; lead separation systems; lead signal; learning (artificial intelligence); model-based methods; music; Music; music separation; musical structures; musicology; overview; particular complexity; particular difficulty; popular music; popular topic; relevant prior knowledge; remixing; Source separation; source separation; source separation yields; Spectrogram; Speech; Speech processing; Time-frequency analysis", } @Article{Wang:2018:SER, author = 
"C. Wang and J. Wang and A. Santoso and C. Chiang and C. Wu", title = "Sound Event Recognition Using Auditory-Receptive-Field Binary Pattern and Hierarchical-Diving Deep Belief Network", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1336--1351", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2738443", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "audio signal processing; audio-visual descriptor; Auditory receptive fields binary patterns; auditory-receptive-field binary pattern; automatic sound event recognition; belief networks; cepstral analysis; cepstral features; classification method; Data mining; deep neural network system; environmental sound; feature extraction; Feature extraction; Hidden Markov models; hierarchical diving deep belief network; hierarchical-diving deep belief network; human auditory receptive field model; image classification; image representation; neural nets; Neural networks; physical feature representation; practical SER system; sound event classification; sound event detection; Spectrogram; spectrogram image feature; Speech; speech recognition; Speech recognition", } @Article{Yang:2018:JPT, author = "L. Yang and M. Zhang and Y. Liu and M. Sun and N. Yu and G. 
Fu", title = "Joint {POS} Tagging and Dependence Parsing With Transition-Based Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1352--1358", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2017.2788181", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Artificial neural networks; dependence parsing; dependency parsing; Dependency parsing; feature sparsity; grammars; joint model; joint modeling; Labeling; labeling conflicts; natural language processing; natural languages; Natural languages; neural nets; neural network based classifiers; neural networks; part-of-speech tagging; pattern classification; POS tagging; shift-reduce conflicts; Speech; Syntactics; Tagging; tagging conflicts; transition-based neural networks", } @Article{Yu:2018:RST, author = "K. Yu and Z. Zhao and X. Wu and H. Lin and X. 
Liu", title = "Rich Short Text Conversation Using Semantic-Key-Controlled Sequence Generation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1359--1368", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2819941", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "chatbot; controllable memory trigger; Data models; Decoding; external-memory tensor; learning (artificial intelligence); Logic gates; natural language processing; Question and answer; semantic-key-controlled sequence generation; Semantics; semantics; sequence to sequence learning; sequence-to-sequence learning approach; sequence-to-sequence model; sequence-to-sequence training; sequences; short text conversation; short text conversation (STC); Speech; Speech processing; STC; text analysis; Training", } @Article{Lehner:2018:OLI, author = "B. Lehner and J. Schl{\"u}ter and G. 
Widmer", title = "Online, Loudness-Invariant Vocal Detection in Mixed Music Signals", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1369--1380", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2825108", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; Feature extraction; Hidden Markov models; human singing voice expressive richness; human singing voice timbral richness; Instruments; interfering instrumental accompaniment; learning (artificial intelligence); long short-term memory recurrent neural network classifier; loudness; LSTM-RNN; machine learning; mixed music signals; music; music information retrieval; music recording; neural network; online loudness-invariant vocal detection; recurrent neural nets; signal classification; Singing voice detection; singing voice detection; sound production system; Spectrogram; Speech; Speech processing; Task analysis; VD; voice activity detection", } @Article{Stone:2018:CEP, author = "S. Stone and M. Marxen and P. 
Birkholz", title = "Construction and Evaluation of a Parametric One-Dimensional Vocal Tract Model", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1381--1392", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2825601", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "aero-acoustic simulations; articulatory speech synthesis; articulatory synthesis; Computational modeling; consonant recognition rate; Electron tubes; German consonants; German vowels; higher dimensional vocal tract model; Larynx; mean square error methods; minimum root-mean-square error; one-dimensional vocal tract area function; parametric one-dimensional vocal tract model; reference area functions; Shape; Solid modeling; Speech; speech production; speech recognition; speech synthesis; Three-dimensional displays; Vocal tract models; vocal tract shapes; vowel recognition rate", } @Article{Tan:2018:AVD, author = "T. Tan and Y. Qian and H. Hu and Y. Zhou and W. Ding and K. 
Yu", title = "Adaptive Very Deep Convolutional Residual Network for Noise Robust Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1393--1405", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2825432", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic modeling; Adaptation models; adaptive very deep convolutional residual network; additive noise; advanced model; AMI; Aurora4; automatic speech recognition; canonical model; CAT; Cats; channel distortion; CHiME4; cluster adaptive training; convolutional neural network; deep convolutional neural networks; different noisy conditions; factor aware training; FAT; feedforward neural nets; model adaptation; Noise measurement; noise robust speech recognition; noisy environments; noisy scenarios; performance degradation; real noisy data; residual learning; reverberation; Robust speech recognition; simulated data; Speech; Speech recognition; speech recognition; superior noise robustness; system performance; Task analysis; testing conditions; Training; transcription task; VDCRN; WER; word error rate", } @Article{Wang:2018:ANF, author = "X. Wang and S. Takaki and J. 
Yamagishi", title = "Autoregressive Neural {F0} Model for Statistical Parametric Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1406--1419", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2828650", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Artificial neural networks; autoregressive model; autoregressive neural F0 model; conventional mean-based generation method; DAR; data dropout strategies; Data models; F0; F0 contours; F0 datum; Feature extraction; Fundamental frequency; fundamental frequency models; Hidden Markov models; Linguistics; neural network; noisy F0 contours; nonlinear AR dependency; normal RNN; pitch; recurrent neural nets; recurrent neural networks; SAR; shallow autoregressive recurrent mixture density network; Speech; speech synthesis; statistical dependency; statistical parametric speech synthesis; temporal dependency; text-to-speech synthesis", } @Article{Valentini-Botinhao:2018:SEN, author = "C. Valentini-Botinhao and J. 
Yamagishi", title = "Speech Enhancement of Noisy and Reverberant Speech for Text-to-Speech", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1420--1433", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2828980", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "additive noise data; clean data; dereverberation; enhanced synthetic voice; environmental noise; event-based scheduling; Feature extraction; generalized closed skew normal distribution; Noise measurement; noise suppression; noise-only case; noisy recordings; parallel data; recurrent neural nets; recurrent neural network; Remote state estimation; reverberant recordings; reverberant speech; Reverberation; reverberation; Speech; speech enhancement; Speech enhancement; speech enhancement methods; studio-quality recordings; text-to-speech; Training", } @Article{Koutrouvelis:2018:LCR, author = "A. I. Koutrouvelis and T. W. Sherson and R. Heusdens and R. C. 
Hendriks", title = "A Low-Cost Robust Distributed Linearly Constrained Beamformer for Wireless Acoustic Sensor Networks With Arbitrary Topology", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1434--1448", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2829405", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "arbitrary distributed network topologies; array signal processing; cross power spectral density matrix; Distributed beamforming; Estimation error; filtering theory; LCMV; linear equality constraints; matrix algebra; Microphones; MVDR; Network topology; Noise measurement; optimisation; optimization problem; relative acoustic transfer function estimation errors; Reverberation; robust beamforming; robust distributed linearly constrained beamformer; Robustness; speech enhancement; WASN; wireless acoustic sensor network; wireless sensor networks", } @Article{Anonymous:2018:IATf, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1449--1450", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855875", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ITMf, author = 
"Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "1451--1452", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855877", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPl, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "C3--C3", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855879", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:BPf, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "26", number = "8", pages = "C4--C4", month = aug, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855881", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:FCg, author = "Anonymous", title = "Front Cover", journal = 
j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "C1--C1", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855919", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPm, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "C2--C2", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855921", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCh, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1453--1454", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855923", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCEh, author = "Anonymous", title = "Table of Contents [Edics]", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1455--1456", month = sep, year = 
"2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855925", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2018:RAD, author = "C. Wu and C. Dittmar and C. Southall and R. Vogl and G. Widmer and J. Hockman and M. M{\"u}ller and A. Lerch", title = "A Review of Automatic Drum Transcription", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1457--1483", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2830113", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "ADT research; ADT systems; ADT techniques; automatic drum transcription; automatic music transcription; classification; computational methods; deep learning; drum part; drum sound events; drum-specific variations; information retrieval; Instruments; machine learning; matrix decomposition; matrix factorization; music; Music information retrieval; music information retrieval; musical style; nonnegative matrix factorization; pattern classification; percussion; recorded music; recurrent neural nets; Rhythm; rhythm-related music processing tasks; Spectrogram; Speech processing; state-of-the-art systems; Task analysis; task-specific challenges; Transient analysis; umbrella term automatic drum transcription; Western popular music", } @Article{Evers:2018:AS, author = "C. Evers and P. A. 
Naylor", title = "Acoustic {SLAM}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1484--1498", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2828321", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "accurate positional information; acoustic generators; Acoustic scene mapping; acoustic signal processing; acoustic signals; Acoustic Simultaneous Localization; Acoustic SLAM; acoustic sources; array signal processing; Bayes methods; consequent false DoA estimates; Direction-of-Arrival; Direction-of-arrival estimation; direction-of-arrival estimation; inactivity lead; microphones; missing DoA estimates; multiple sound sources; observer motion; Observers; positional source information; Probability density function; Reverberation; reverberation; robot audition; scene map; Simultaneous localization and mapping; simultaneous localization and mapping; SLAM (robots); sound source localization accuracy; source directions; source location estimation; source-sensor range; Speech; three-dimensional representation", } @Article{Laroche:2018:HPN, author = "C. Laroche and M. Kowalski and H. Papadopoulos and G. 
Richard", title = "Hybrid Projective Nonnegative Matrix Factorization With Drum Dictionaries for Harmonic\slash Percussive Source Separation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1499--1511", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2830116", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "audio signal; audio signal processing; audio source separation; blind source separation; Dictionaries; drum dictionaries; Harmonic analysis; harmonic source separation algorithms; harmonic/percussive decomposition; hybrid projective nonnegative matrix factorization; Instruments; matrix decomposition; Matrix decomposition; Multiple signal classification; multiplicative update rules; Music; music; music database; music signals; Nonnegative matrix factorization; orthogonal nonnegative decomposition; percussive source separation algorithms; projective nonnegative matrix factorization; short-term broadband sounds; signal representation; signal time frequency representation decomposition; smooth spectra prelearned dictionary; source separation; Source separation; sparse decomposition; sparse nonnegative decomposition; straightforward NMF decomposition; tonal part; transient part", } @Article{Carabias-Orti:2018:MBS, author = "J. J. Carabias-Orti and J. Nikunen and T. Virtanen and P. 
Vera-Candeas", title = "Multichannel Blind Sound Source Separation Using Spatial Covariance Model With Level and Time Differences and Nonnegative Matrix Factorization", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1512--1527", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2830105", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "achieved separation performance; audio signal processing; blind source separation; complex-valued nonnegative matrix factorization; covariance matrices; Covariance matrices; direction of arrival estimation; Direction-of-arrival estimation; direction-of-arrival estimation; direction-of-arrival kernels; DOA kernels; Euclidean distance; explicit modeling; interaural level difference; interaural time difference; Itakura-Saito divergence; Kernel; level difference covariance matrices; level differences; magnitude spectrograms; matrix decomposition; Microphones; microphones; multichannel blind sound source separation; Multichannel source separation; NMF model; non-negative matrix factorization; phase difference covariance matrices; predefined source directions; reverberation; SCM model; source localization; Source separation; source spatial covariance matrices; spatial covariance model; spatial properties; Spectrogram; time differences; Time-frequency analysis; two-channel SiSEC development dataset", } @Article{Zhang:2018:SEN, author = "M. Zhang and N. Yu and G. 
Fu", title = "A Simple and Effective Neural Model for Joint Word Segmentation and {POS} Tagging", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1528--1538", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2830117", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Bidirectional control; Chinese natural language processing; Chinese word segmentation; Decoding; joint model; joint word segmentation; learning (artificial intelligence); long short term memory neural network structures; Natural language processing; natural language processing; neural joint model; neural nets; Neural networks; neural networks; POS tagging; Predictive models; sequence-to-sequence neural model; Tagging; Task analysis; transition system; well-defined transition system", } @Article{Menzies:2018:CPM, author = "D. Menzies and F. M. 
Fazi", title = "A Complex Panning Method for Near-Field Imaging", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1539--1548", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2827300", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "adaptive panning method; Augmented reality; complex panning method; conventional amplitude panning; distant objects; Ear; extended panning method; Frequency control; Frequency-domain analysis; head orientation; hearing; image direction; Imaging; Inter-aural Level Difference cues; loudspeakers; Loudspeakers; near-field image; near-field region; single first order filter; spatial audio; Speech processing; stereo; stereo image processing; stereo panning functions; tangent law; transfer functions; VBAP", } @Article{Misra:2018:MLL, author = "A. Misra and J. H. L. 
Hansen", title = "Maximum-Likelihood Linear Transformation for Unsupervised Domain Adaptation in Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1549--1558", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2831460", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "domain adaptation; EM algorithm; expectation-maximisation algorithm; expectation-maximization algorithm; front-end factor analysis; Gaussian mixture model; Gaussian processes; GMM; i-Vector space; in-domain development data; maximum-likelihood linear transformation; mixture models; National Institute of Standards and Technology Speaker Recognition Evaluation; optimisation; optimization process; out-of-domain development data; probability; probability density estimation problem; speaker recognition; speaker recognition evaluation; Speaker verification; SRE-2016 corpus; transforms; unsupervised domain adaptation; unsupervised probabilistic feature transformation parameters; UPFT; vectors", } @Article{Wakabayashi:2018:SCS, author = "Y. Wakabayashi and T. Fukumori and M. Nakayama and T. Nishiura and Y. 
Yamashita", title = "Single-Channel Speech Enhancement With Phase Reconstruction Based on Phase Distortion Averaging", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1559--1569", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2831632", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "amplitude spectrum; Discrete Fourier transforms; fundamental frequency; Harmonic analysis; harmonic enhancement; harmonic phase spectra; harmonic structure; Noise measurement; phase distortion; phase distortion averaging; phase distortion feature; Phase reconstruction; phase reconstruction method; Reconstruction algorithms; signal reconstruction; single-channel speech enhancement; Speech enhancement; speech enhancement; speech phase spectrum; speech quality; speech signal; Time-frequency analysis; time-frequency analysis", } @Article{Fu:2018:EEW, author = "S. Fu and T. Wang and Y. Tsao and X. Lu and H. 
Kawai", title = "End-to-End Waveform Utterance Enhancement for Direct Evaluation Metrics Optimization by Fully Convolutional Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1570--1584", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2821903", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Automatic speech recognition; automatic speech recognition system; clean speech; direct evaluation metrics optimization; end-to-end speech enhancement; end-to-end utterance-based speech enhancement framework; end-to-end waveform utterance enhancement; evaluation criterion; FCN enhancement framework; fully convolutional neural network; fully convolutional neural networks; learning (artificial intelligence); Linear programming; long speech segments; mean square error; mean square error methods; model optimization criterion; MSE-optimized speech; neural nets; Noise measurement; noisy speech; optimisation; Optimization; perception-based objective function; raw waveform; short-time objective intelligibility measure; Speech; Speech enhancement; speech enhancement; speech intelligibility; speech recognition; STOI measure; temporal correlation information; Training; training stage", } @Article{Xiao:2018:RNS, author = "K. Xiao and S. Wang and M. Wan and L. 
Wu", title = "Radiated Noise Suppression for Electrolarynx Speech Based on Multiband Time-Domain Amplitude Modulation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1585--1593", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2834729", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic characteristics; amplitude modulation; artificial noise; EL speech; electrolarynx speech; Electrolarynx speech; enhancement; MTAM; multiband time-domain amplitude modulation; perceptual characteristics; radiated noise; radiated noise suppression; residual noise intensity; speech components; speech enhancement; speech intelligibility; speech quality; time-domain amplitude modulation; Wiener filters", } @Article{Fahim:2018:PES, author = "A. Fahim and P. N. Samarasinghe and T. D. 
Abhayapala", title = "{PSD} Estimation and Source Separation in a Noisy Reverberant Environment Using a Spherical Microphone Array", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1594--1607", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2835723", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "array signal processing; Bessel functions; coherent background noise; Correlation; Estimation; Harmonic analysis; individual power spectral density components; inherent orthogonality; microphone arrays; Microphone arrays; multisource reverberant sound scene; Noise measurement; Noise suppression; power spectral density; PSD components; PSD estimation; Reverberation; reverberation; source separation; speech dereverberation; spherical harmonics basis functions; spherical harmonics domain; spherical microphone array", } @Article{He:2018:NRF, author = "H. He and J. Chen and J. Benesty and T. 
Yang", title = "Noise Robust Frequency-Domain Adaptive Blind Multichannel Identification With {$\ell_p$}-Norm Constraint", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1608--1619", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2835729", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "$\ell _p$-norm penalty; $\ell _p$-norm constraint; acoustic communication (telecommunication); acoustic signal processing; Acoustics; adaptive filter; adaptive filters; Blind multichannel identification; blind source separation; channel estimation; Cost function; frequency-domain adaptive filtering; frequency-domain analysis; Frequency-domain analysis; least mean squares methods; noise robust frequency-domain adaptive blind multichannel identification; noise-free environments; RNMCFLMS algorithm; robust normalized multichannel frequency-domain least mean square algorithm; Robustness; robustness; Signal processing algorithms; SIMO system; single-input multiple-output acoustic system; sparsity; spectral flatness constraint; Speech processing; Time-domain analysis; transient response", } @Article{Zhang:2018:MEP, author = "W. Zhang and Z. Chen and F. Yin and Q. 
Zhang", title = "Melody Extraction From Polyphonic Music Using Particle Filter and Dynamic Programming", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1620--1632", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2834722", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; audio signal processing; Bayes methods; Bayesian filtering; Bayesian filtering framework; constant-Q transform; Data mining; Dynamic programming; dynamic programming; feature extraction; frame-wise pitches; Harmonic analysis; information retrieval; instrumental melodies; melodic contour; Melody extraction; melody extraction method; multiresolution spectral analysis; music; music information; Music information retrieval; music information retrieval; music information retrieval community; particle filter; particle filtering (numerical methods); pitch transition probability; polyphonic music; probability; publicly available dataset; rough melody contour; spectral analysis; statistical analysis; Timbre; vocal melodies", } @Article{Zhang:2018:TIS, author = "C. Zhang and K. Koishida and J. H. L. 
Hansen", title = "Text-Independent Speaker Verification Based on Triplet Convolutional Neural Network Embeddings", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1633--1644", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2831456", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "channel variabilities compensation; conventional speaker recognition pipelines; deep neural networks; end-to-end fashion; Euclidean distance; Euclidean distance similarity metric; feature extraction; feature representation; feedforward neural nets; fixed-length input constraint; fixed-length input speaker embedding system; fixed-length speaker discriminative embedding; front-end speaker; i-vector; Inception-Resnet-v1 architecture; learning (artificial intelligence); network training; neural network based speaker discriminative training; Neural networks; NIST; noise variabilities compensation; novel text-independent speaker verification framework; performance gain; PLDA; probabilistic linear discriminant analysis; severe test condition mismatches; severe training condition mismatches; sparse speech features; spatial pyramid pooling; spatial pyramid pooling layer; Speaker recognition; speaker recognition; Speech processing; statistical analysis; SV system; SV task; SV testing; system performance; Task analysis; testing performance; Training; triplet convolutional neural network embeddings; triplet loss; very deep convolutional neural network architecture; very deep convolutional neural networks", } @Article{R:2018:PPS, author = "A. R. MV and P. K. 
Ghosh", title = "{PSFM} --- A Probabilistic Source Filter Model for Noise Robust Glottal Closure Instant Detection", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1645--1657", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2834733", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "all-pole filter coefficients; archivable priority list actual-word database database; Bernoulli Gaussian distribution; clean speech; computational complexity; database management systems; Dynamic programming; dynamic programming; exact GCI locations; filtering theory; Gaussian distribution; GCI detection; Gibbs sampling; glottal inverse filtering; Heuristic algorithms; N-best dynamic programming; noise robust GCI detection technique; noise robust glottal closure instant detection; Noise robustness; pathological speech; pitch synchronous speech analysis; Probabilistic logic; probabilistic source-filter model; probability; prosody modifications; PSFM; second-order statistics; Signal to noise ratio; signal-to-noise ratio levels; Speech processing; speech processing; voiced speech", } @Article{Airaksinen:2018:CBS, author = "M. Airaksinen and L. Juvela and B. Bollepalli and J. Yamagishi and P. 
Alku", title = "A Comparison Between {STRAIGHT}, Glottal, and Sinusoidal Vocoding in Statistical Parametric Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1658--1670", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2835720", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; Acoustics; analysis-synthesis; crowd-sourced listening test; formal test; glottal vocoding; GlottDNN; mixed excitation vocoders; PML; Predictive models; Production; pulse model in log-domain; shared envelope model; sinusoidal vocoding; speech coding; Speech synthesis; speech synthesis; Speech synthesis; speech waveform; statistical analysis; statistical parametric speech synthesis; statistical parametric speech synthesis framework; straight vocoding; synthesized speech quality; text-to-speech synthesis; Transfer functions; TTS synthesis; vocoder; vocoder quality; vocoder-specific features; vocoders; Vocoders; waveform generation method", } @Article{Mahe:2018:PCR, author = "G. Mah{\'e} and M. 
Ja{\"\i}dane", title = "Perceptually Controlled Reshaping of Sound Histograms", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1671--1683", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2836143", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "audio processing algorithms; audio signal processing; filtering theory; flat-spectrum version; frequency masking model; Frequency-domain analysis; generic algorithm; HGR; histogram global reshaping; histogram local reshaping; histogram low-pass filtering; Histograms; inaudible noise; iterative methods; low-pass filtering; low-pass filters; low-power white noise; noise audibility; noise audibility control; optimal performance; quantisation (signal); Quantization (signal); quantization theorem; Shape; signal-plus-noise mixture; Sound histogram equalization; sound histograms; sound reshaping; Source separation; source separation; sparsification; specific signal statistical distributions; Speech processing; statistical distributions; target histogram; Time-domain analysis; white noise", } @Article{Huang:2018:TSS, author = "Q. Huang and L. Zhang and Y. 
Fang", title = "Two-Step Spherical Harmonics {ESPRIT}-Type Algorithms and Performance Analysis", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1684--1697", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2836436", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "array signal processing; complex spherical harmonics domain; computational complexity; decomposition; Direction-of-arrival (DOA) estimation; direction-of-arrival estimation; DOA estimation; eigenvalue decomposition; eigenvalues and eigenfunctions; estimation of signal parameter via rotational invariance technique (ESPRIT); EVD; high-resolution estimation of signal parameter via rotational invariance technique; matrix algebra; mean square error (MSE); mean square error methods; mean square errors; MSE; parameter estimation; real-valued two-step SHESPRIT; semiRTS-SHESPRIT method; signal resolution; spherical array; spherical arrays; TS-SHESPRIT; two-step method; two-step spherical harmonics ESPRIT-type algorithms; unitary transformation", } @Article{Anonymous:2018:IATg, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1698--1699", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855927", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", 
journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ITMg, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "1700--1702", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855929", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPn, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "C3--C3", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855931", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:BPg, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "26", number = "9", pages = "C4--C4", month = sep, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855933", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:FCh, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "C1--C1", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855939", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPo, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "C2--C2", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855941", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCi, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1698--1699", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855943", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCEi, author = 
"Anonymous", title = "Table of Contents [Edics]", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1700--1701", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855945", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2018:SSS, author = "D. Wang and J. Chen", title = "Supervised Speech Separation Based on Deep Learning: an Overview", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1702--1726", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2842159", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "array separation; beamforming; deep learning; deep neural networks; Interference; learning (artificial intelligence); multitalker separation; Noise measurement; Speech separation; speaker separation; speech dereverberation; Speech enhancement; speech enhancement; speech intelligibility; speech-nonspeech separation; Supervised learning; supervised learning problem; supervised separation algorithms; supervised speech separation; target speech; Task analysis; time-frequency masking; Training", } @Article{Wang:2018:SSWb, author = "R. Wang and M. Utiyama and A. Finch and L. Liu and K. Chen and E. 
Sumita", title = "Sentence Selection and Weighting for Neural Machine Translation Domain Adaptation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1727--1741", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2837223", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Adaptation models; conventional phrase-based machine translation; Decoding; domain adaptation; domain adaptation techniques; domain tags; domain weighting; domain-specific tasks; dynamic training methods; in-domain corpus; language translation; learning (artificial intelligence); machine translation tasks; multidomain sentence; natural language processing; Neural machine translation; neural machine translation domain adaptation; NMT domain problem; NMT internal sentence embedding; NMT performance; NMT training; out-of-domain corpora; out-of-domain sentences; real-world NMT scenario; sentence embedding similarity; sentence level NMT domain adaptation; sentence selection; sentence weighting methods; Speech processing; statistical analysis; Task analysis; Testing; Training; Training data; translation performance", } @Article{Khan:2018:UVS, author = "F. U. Khan and B. P. Milner and T. 
{Le Cornu}", title = "Using Visual Speech Information in Masking Methods for Audio Speaker Separation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1742--1754", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2835719", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "audio feature space; audio information; audio mask; audio ratio; audio signal processing; audio speaker separation; audio-masking-based speaker separation; audio-visual masking methods; audio-visual masks; audio-visual processing; audio-visual ratio masks; binary masks; Cameras; deep neural network; Estimation; feature extraction; Feature extraction; intelligibility tests; Lips; masking methods; neural nets; ratio mask; speaker recognition; Speaker separation; speech intelligibility; speech mixture; speech processing; Speech processing; speech quality; target speech; Time-frequency analysis; visual information; visual speech features; visual speech information; visual-only methods; Visualization; visually derived binary mask estimation; visually derived ratio mask estimation", } @Article{Li:2018:MIN, author = "X. Li and S. Gannot and L. Girin and R. 
Horaud", title = "Multichannel Identification and Nonnegative Equalization for Dereverberation and Noise Reduction Based on Convolutive Transfer Function", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1755--1768", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2839362", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; additive noise; Additive noise; Blind equalizers; blind multichannel identification; blind room impulse response identification; blind source separation; common zeros problem; complex-valued convolution model; complex-valued CTFs; convolution; Convolution; convolutive transfer function; CTF magnitude; dereverberation; equalisers; filtering theory; Fourier transforms; frequency aliasing; frequency response; Frequency response; joint speech dereverberation; long impulse responses; Microphones; microphones; multichannel equalization; Multichannel identification; near-common zeros; noise power related tolerance; Noise reduction; noise reduction; nonflat frequency response; nonnegative convolution model; nonnegative equalization; nonnegative multichannel equalization method; oversampled signals; oversampled STFT; reverberation; short-time Fourier; signal sampling; source signal; STFT framework; STFT magnitude; STFT window; Time-domain analysis; time-domain analysis; time-domain cross-relation method; time-domain impulse response; transfer functions; transient response", } @Article{enel:2018:SSI, author = "L{\"u}tfi Kerem {\c{S}}enel and {\.I}hsan Utlu and Veysel Y{\"u}cesoy and Aykut Ko{\c{c}} and Tolga {\c{C}}ukur", title = "Semantic 
Structure and Interpretability of Word Embeddings", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1769--1779", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2837384", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Interpretability; latent semantic structure; natural language processing; Natural language processing; natural language processing; NLP; semantic relations; semantic structure; Semantics; Sparse matrices; Speech processing; Standards; Statistical analysis; Task analysis; vector spaces; word embeddings; word embeddings interpretability; word intrusion test", } @Article{Koizumi:2018:DBS, author = "Y. Koizumi and K. Niwa and Y. Hioka and K. Kobayashi and Y. 
Haneda", title = "{DNN}-Based Source Enhancement to Increase Objective Sound Quality Assessment Score", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1780--1792", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2842156", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "backpropagation; black-box-optimization scheme; deep learning; deep neural network based source enhancement; DNN optimization scheme; Estimation; gradient methods; high OSQA scores; high-quality output signals; learning (artificial intelligence); Linear programming; mean square error methods; neural nets; objective sound quality assessment (OSQA) score; objective sound quality assessment score; optimisation; Optimization; policy gradient method; probability; Quality assessment; sound-quality evaluation; Sound-source enhancement; speech enhancement; Speech processing; Time-frequency analysis; time-frequency mask; Training", } @Article{Paleologu:2018:LSI, author = "C. Paleologu and J. Benesty and S. 
Ciochin{\u{a}}", title = "Linear System Identification Based on a {Kronecker} Product Decomposition", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1793--1808", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2842146", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic impulse responses; acoustic signal processing; approximation theory; Convergence; echo cancelation perspective; echo cancelers; echo cancellation; Echo cancellers; echo paths; echo suppression; filtering theory; identification; impulse response decomposition; iterative algorithm; Iterative methods; iterative methods; iterative Wiener filter; linear system identification; Linear systems; linear systems; long length impulse responses; Matrix decomposition; nearest Kronecker product; nearest Kronecker product decomposition; optimal impulse response approximation; Speech processing; statistical analysis; statistics estimation; System identification; system identification problem; transient response; Wiener filter; Wiener filters", } @Article{Xiong:2018:EAI, author = "F. Xiong and S. Goetze and B. Kollmeier and B. T. 
Meyer", title = "Exploring Auditory-Inspired Acoustic Features for Room Acoustic Parameter Estimation From Monaural Speech", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1809--1820", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2843537", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic characterisation; acoustic environments; acoustic features; acoustic noise; acoustic signal processing; architectural acoustics; artificial neural network; auditory-inspired acoustic features; automatic speech recognition; blind estimation; blind ROom Parameter Estimator; channel bank filters; early-to-late reverberation ratio; ELR estimation; Estimation; Frequency modulation; fullband signals; improved fullband estimations; individual filters; machine learning; monaural speech; neural nets; real-time applications; reverberant environments; reverberation; Reverberation; reverberation time; Reverberation time; room acoustic parameter estimation; room acoustic parameters; room impulse responses; ROPE model; ROPE performance; signal enhancement algorithms; single-microphone speech signals; spectral analysis; Speech enhancement; speech enhancement; speech recognition; speech time-frequency representation; speech variability; subband signals; temporal modulation filter bank; temporal modulation frequencies; time 3.0 s; transient response", } @Article{LeLan:2018:AMC, author = "G. {Le Lan} and D. Charlet and A. Larcher and S. 
Meignier", title = "An Adaptive Method for Cross-Recording Speaker Diarization", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1821--1832", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2844025", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic conditions; acoustic mismatch; Acoustics; Adaptation models; between-recording variability compensation methods; between-recording variability estimation; cross-recording DER; cross-recording speaker diarization; domain adaptation; Estimation; Hidden Markov models; initial training dataset; linking system; Mathematical model; out-of-domain data; Radio recordings; scalable unsupervised adaptation framework; Speaker diarization; speaker linking; speaker recognition; Task analysis; Training; unlabeled speakers; unsupervised learning; variable collection sizes", } @Article{Xue:2018:MDM, author = "W. Xue and A. H. Moore and M. Brookes and P. A. 
Naylor", title = "Modulation-Domain Multichannel {Kalman} Filtering for Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1833--1847", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2845665", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Array signal processing; Correlation; Estimation; Fourier transforms; inter-frame temporal evolution; interchannel spatial correlation; interframe temporal correlation; Kalman filtering; Kalman filters; microphone arrays; Microphones; modulation domain; modulation-domain multichannel Kalman filtering; multichannel KF; multichannel methods; Noise measurement; optimal filters; optimal MKF gain; second-order signal statistics; single-channel Kalman; single-channel modulation-domain KF; single-channel speech enhancement methods; Speech enhancement; speech enhancement; speech spectrum", } @Article{Wu:2018:MDE, author = "K. Wu and V. G. Reju and A. W. H. 
Khong", title = "Multisource {DOA} Estimation in a Reverberant Environment Using a Single Acoustic Vector Sensor", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1848--1859", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2845121", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; acoustic vector sensor; blind source separation; direction-of-arrival estimation; Direction-of-arrival estimation; DOA estimation; Estimation; Indexes; low-reverberant-single-source; LRSS detection; LRSS point detection; Microphones; multiple sources; multiple speech sources; multisource DOA estimation; multisource reverberant environments; reverberant environment; Reverberation; reverberation; Robot sensing systems; signal detection; single acoustic vector sensor; source signals; speech processing; TF domain; TF-point level; TF-zone level; time-frequency analysis; time-frequency domain", } @Article{Huang:2018:EHG, author = "J. Huang and Y. Sun and W. Zhang and H. Wang and T. 
Liu", title = "Entity Highlight Generation as Statistical and Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1860--1872", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2845111", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "attention mechanism; Computational modeling; copy mechanism; coverage mechanism; Decoding; decoding process; Entity highlight generation; entity highlight generation; entity name; entity-specific highlights; language translation; learning (artificial intelligence); Manuals; natural language processing; neural machine translation; neural nets; neural summarization; Seq2Seq approach; Seq2Seq model; sequence-to-sequence learning approach; Speech processing; statistical analysis; statistical machine translation; Task analysis; Training data; Web search", } @Article{Do:2018:SSM, author = "Q. T. Do and S. Sakti and S. 
Nakamura", title = "Sequence-to-Sequence Models for Emphasis Speech Translation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1873--1883", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2846402", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "emphasis estimation; Emphasis estimation; Emphasis Speech Translation; emphasis translation; emphasis translation task; Hidden Markov models; joint optimization; joint optimization of words and emphasis; joint translation model; language translation; Linguistics; natural language processing; optimisation; Optimization; Pipelines; Quantization (signal); S2ST systems; sequence translation tasks; sequence-to-sequence models; Speech processing; speech processing; speech synthesis; speech-to-speech translation (S2ST); Speech-to-speech translation systems; Task analysis; translation models; translation performance", } @Article{Fontana:2018:EFP, author = "F. Fontana and E. 
Bozzo", title = "Explicit Fixed-Point Computation of Nonlinear Delay-Free Loop Filter Networks", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1884--1896", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2847442", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Computational modeling; delay-free loops; Digital delay-free loop; digital filters; discrete-time nonlinear filter networks; discrete-time realization; EMS VCS3 analog synthesizer; explicit fixed-point computation; fixed-point method; fixed-point search; fixed-point solvers; Integrated circuit modeling; iterative method; iterative methods; Mathematical model; Modulation; nonlinear delay-free loop filter networks; nonlinear differential equations; nonlinear filter network; nonlinear filters; Numerical models; ring modulator; RLC circuits; Speech processing; voltage-controlled filter; voltage-controlled oscillators", } @Article{Widmark:2018:CIA, author = "S. 
Widmark", title = "Causal {IIR} Audio Precompensator Filters Subject to Quadratic Constraints", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1897--1912", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2839355", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; causal IIR audio precompensator filters; computational complexity; control system synthesis; Convex functions; Delays; Design methodology; discrete time filters; discrete-time multiple-input multiple-output filter; feedforward; Finite impulse response filters; FIR filters; Frequency-domain analysis; gain control; IIR filters; impulse response Wiener filtering; infinite impulse response Wiener precompensator design; linear feedforward controller design; linear quadratic control; linear quadratic optimal; linear systems; Loudspeakers; optimization methods; Signal processing algorithms; Transfer functions; transient response; Wiener filters", } @Article{Winter:2018:CLW, author = "F. Winter and H. Wierstorf and C. Hold and F. Kr{\"u}ger and A. Raake and S. 
Spors", title = "Colouration in Local Wave Field Synthesis", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1913--1924", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2842435", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic field; acoustic signal processing; ambisonics; colouration; driving signals; emitted sound fields; extended listening area; Frequency-domain analysis; Harmonic analysis; hearing; listening experiments; local wave field synthesis; Loudspeakers; loudspeakers; Mathematical model; near-field-compensated higher order ambisonics; perceived colouration; Rendering (computer graphics); Sound field synthesis; sound field synthesis techniques; Speech processing; timbre; Timbre; wave field synthesis", } @Article{Andersen:2018:NSI, author = "A. H. Andersen and J. M. {de Haan} and Z. Tan and J. 
Jensen", title = "Nonintrusive Speech Intelligibility Prediction Using Convolutional Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1925--1939", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2847459", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Artificial intelligence; Auditory system; computational structure; convolution; Convolutional neural networks; convolutional neural networks; deep learning; learning (artificial intelligence); neural nets; Noise measurement; nonintrusive SIP algorithms; Nonintrusive speech intelligibility prediction; nonintrusive speech intelligibility prediction; Prediction algorithms; Signal processing algorithms; speech intelligibility; Speech processing; speech processing; speech processing algorithms; speech processing devices", } @Article{Anonymous:2018:IATh, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1940--1941", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855947", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ITMh, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on 
Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "1942--1944", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855949", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPp, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "C3--C3", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855951", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:BPh, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "26", number = "10", pages = "C4--C4", month = oct, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855953", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:FCi, author = "Anonymous", title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = 
"C1--C1", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2880631", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPq, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "C2--C2", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2881067", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCj, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "1945--1946", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2867321", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCEj, author = "Anonymous", title = "Table of Contents [Edics]", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "1947--1948", month = nov, year = "2018", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2018.2867323", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hadian:2018:FSS, author = "H. Hadian and H. Sameti and D. Povey and S. Khudanpur", title = "Flat-Start Single-Stage Discriminatively Trained {HMM}-Based Models for {ASR}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "1949--1961", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2848701", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "automatic speech recognition; CD modeling approach; Context modeling; Databases; Decoding; discriminatively trained HMM-based models; flat-start; flat-start single-stage; Hidden Markov models; hidden Markov models; hidden Markov models-GMM models; Lattice-free; lattice-free maximum mutual information objective function; LF-MMI setup; Linear programming; maximum mutual information; Neural networks; regular tree-based CD modeling; single-stage; speech recognition; Training; tree-building steps; tree-free CD modeling technique; vocabulary continuous speech recognition", } @Article{Katzberg:2018:CSF, author = "F. Katzberg and R. Mazur and M. Maass and P. Koch and A. 
Mertins", title = "A Compressed Sensing Framework for Dynamic Sound-Field Measurements", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "1962--1975", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2851144", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "bandlimited signals; compressed sensing; Compressed sensing; compressed sensing framework; compressed sensing models; compressed sensing problem; compressed-sensing based recovery; dynamic sampling problem; dynamic sound-field measurement; dynamic sound-field measurements; Interpolation; interpolation; Linear systems; Mathematical model; microphone array; microphone positions; microphone trajectory; Microphones; modeled equidistant grid; modeled virtual grid; Nyquist-Shannon sampling theorem; random chosen trajectories; room impulse responses; sampling positions; signal reconstruction; signal sampling; sound-field variables; sparse Fourier representations; spatial sampling problem; spatio-temporal sampling problem; Speech processing; stationary microphones; sub-Nyquist sampling; suboptimally chosen trajectories; three-dimensional space; Trajectory; transient response; underdetermined sampling problems", } @Article{Sundar:2018:TBM, author = "H. Sundar and T. V. Sreenivas and C. S. 
Seelamantula", title = "{TDOA}-Based Multiple Acoustic Source Localization Without Association Ambiguity", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "1976--1990", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2851147", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; array signal processing; Delays; direction-of-arrival estimation; Direction-of-arrival estimation; GCC-PHAT; hyperboloid branches; IDIR; interhyperboloidal spatial region; inverse delay interval region; microphone arrays; microphone pairs; microphones; Microphones; multi-source localization; multiple acoustic source localization; multiple source localization; permutation problem; Position measurement; region-constrained localization; reverberation; Reverberation; speaker recognition; Speech processing; TDOA; time-difference of arrival; time-differences of arrival; time-of-arrival estimation", } @Article{Sahraeian:2018:CET, author = "R. Sahraeian and D. 
{Van Compernolle}", title = "Cross-Entropy Training of {DNN} Ensemble Acoustic Models for Low-Resource {ASR}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "1991--2001", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2851145", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; Acoustics; cross-entropy objective function; cross-entropy training; Deep neural networks; DNN ensemble acoustic models; entropy; feature extraction; Feature extraction; Hidden Markov models; Interpolation; language-independent feature extractors; Low resource ASR; low-resource ASR; low-resource target language; model combination; multilingual deep neural networks; multilingual DNN acoustic model; multilingual DNN training; multilingual GlobalPhone dataset; natural language processing; neural nets; Neural networks; out-of-language data; speech recognition; Training; Training data; under-resourced languages", } @Article{Dinkel:2018:IRW, author = "H. Dinkel and Y. Qian and K. 
Yu", title = "Investigating Raw Wave Deep Neural Networks for End-to-End Speaker Spoofing Detection", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2002--2014", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2851155", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "ASV system; ASVspoof2015 dataset; automatic speaker verification; Biological neural networks; convolution; convolutional LSTM neural network; deep convolutional long short-term memory; Deep learning; end-to-end; end-to-end speaker spoofing detection; Feature extraction; feature extraction; feedforward neural nets; Machine learning; malicious spoofing attempts; Mel frequency cepstral coefficient; raw wave deep neural networks; recurrent neural nets; security of data; serious security breaches; speaker recognition; speaker verification; Speech processing; spoof-aware features; spoofing attack; spoofing detection; Task analysis; vanilla neural networks", } @Article{Zhang:2018:RDS, author = "J. Zhang and R. Heusdens and R. C. 
Hendriks", title = "Rate-Distributed Spatial Filtering Based Noise Reduction in Wireless Acoustic Sensor Networks", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2015--2026", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2851157", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic communication (telecommunication); acoustic signal processing; array signal processing; Bit rate; energy consumption; energy efficiency; energy usage; fusion center; LCMV beamforming; linearly constrained minimum variance beamformer; mathematical programming; microphone subset; Microphones; microphones; noise reduction; Noise reduction; noise reduction performance; Rate allocation; rate allocation strategy; rate-distributed spatial filtering; Resource management; semidefinite program; sensor selection; sensor-selection-based approaches; Sensors; signal statistics; sparsity; spatial filters; WASN; wireless acoustic sensor networks; Wireless communication; wireless sensor networks; Wireless sensor networks", } @Article{Heck:2018:DPM, author = "M. Heck and S. Sakti and S. 
Nakamura", title = "{Dirichlet} Process Mixture of Mixtures Model for Unsupervised Subword Modeling", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2027--2042", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2852500", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustic unit discovery; Acoustics; Bayesian nonparametrics; codebook; Convergence; Data models; Dirichlet process; Dirichlet process mixture; ergodic chain; Gibbs sampling; Hidden Markov models; Markov chain Monte Carlo sampler; Markov processes; Mixture models; mixture of mixtures; Monte Carlo methods; nonergodic Gibbs sampler; Speech processing; speech recognition; switch sampler; Switches; unsupervised subword modeling", } @Article{Nie:2018:DLB, author = "S. Nie and S. Liang and W. Liu and X. Zhang and J. 
Tao", title = "Deep Learning Based Speech Separation via {NMF}-Style Reconstructions", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2043--2055", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2851151", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "deep learning; deep neural network (DNN); deep neural networks; DNN; learning (artificial intelligence); Machine learning; magnitude spectrograms; matrix decomposition; neural nets; Neural networks; NMF-style reconstructions; Noise measurement; nonnegative matrix factorization; nonnegative matrix factorization (NMF); representation learning technique; spectro-temporal structures; Spectrogram; Speech enhancement; speech processing; Speech separation; speech separation; Training", } @Article{Dubey:2018:LFD, author = "H. Dubey and A. Sangwan and J. H. L. 
Hansen", title = "Leveraging Frequency-Dependent Kernel and {DIP}-Based Clustering for Robust Speech Activity Detection in Naturalistic Audio Streams", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2056--2071", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2848698", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "audio streaming; Clustering; CRSS long-duration naturalistic noise corpus; DARPA RATS; enhanced spectral decomposition; FDK statistical descriptors; feature extraction; frequency-dependent kernel; frequency-dependent kernel based SAD features; Gaussian mixture model; Gaussian processes; Hartigan dip test; Hartigan dip-based robust feature clustering; Kernel; learning (artificial intelligence); machine learning models; model-based approach; multiple noise-sources; naturalistic audio streams; NIST OpenSAD; NIST OpenSAT; NIST-OpenSAD-2015; NIST-OpenSAT-2017; one-dimensional FDK-SAD features; pattern clustering; peer-led team learning; principal component analysis; Rats; robust speech activity detection; Robustness; SAD annotations; semisupervised Gaussian mixture model; Signal to noise ratio; speaker recognition; speech activity detection; speech processing; Speech processing; standalone SAD evaluations; statistical analysis; supervised SAD; text-dependent speaker verification; Training; variable model-size Gaussian mixture model; VMGMM", } @Article{Jang:2018:CLN, author = "Y. Jang and J. Ham and B. Lee and K. 
Kim", title = "Cross-Language Neural Dialog State Tracker for Large Ontologies Using Hierarchical Attention", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2072--2082", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2852492", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "attention mechanism; attention-weighted word vector; cross language; cross-language adaptation; cross-language neural dialog state tracker; dialog management; Dialog state tracking; dialog state tracking challenge; hierarchical attention mechanism; interactive systems; language translation; learning (artificial intelligence); long short term memory; machine learning-based trackers; machine-translated training data; natural language processing; neural nets; Neural networks; Ontologies; ontologies (artificial intelligence); ontology; Predictive models; Speech processing; Task analysis; Training data; user intent identification; user utterances; vectors; Vocabulary; word processing", } @Article{Weisz:2018:SED, author = "G. Weisz and P. Budzianowski and P. Su and M. 
Ga{\v{s}}i{\'c}", title = "Sample Efficient Deep Reinforcement Learning for Dialogue Systems With Large Action Spaces", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2083--2097", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2851664", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "ACER algorithm; actor-critic methods; artificial intelligence; automated dialogue agents; deep reinforcement learning; Deep reinforcement learning; dialogue policy optimization; Gaussian processes; human computer interaction; human-computer interaction; interactive systems; learning (artificial intelligence); Learning (artificial intelligence); Markov processes; Neural networks; off-policy reinforcement learning; Optimization; policy optimization task; software agents; Speech processing; spoken dialogue systems; Task analysis; Training", } @Article{Lin:2018:RRL, author = "S. 
Lin", title = "Reverberation-Robust Localization of Speakers Using Distinct Speech Onsets and Multichannel Cross Correlations", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2098--2111", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2854871", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustic multisource localization; auditory filterbank; CASA; channel bank filters; concurrent speakers; correlation methods; Direction-of-arrival estimation; direction-of-arrival estimation; directions-of-arrival of speakers; encoded speech onsets; Harmonic analysis; impulse response models; microphone array recordings; microphone arrays; microphone signals; Microphones; multichannel cross correlation; multichannel cross correlations; multichannel cross-correlation coefficient; multiple microphones; onset detection; Psychoacoustic models; reverberant room; reverberation; Reverberation; reverberation-robust localization; separate concurrent speakers; source separation; speaker localization methods; speaker recognition; Speech processing; speech signal; transforms; voice activity detection", } @Article{Abidin:2018:SAU, author = "S. Abidin and R. Togneri and F. 
Sohel", title = "Spectrotemporal Analysis Using Local Binary Pattern Variants for Acoustic Scene Classification", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2112--2121", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2854861", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustic scene; acoustic scene classification; acoustic signal processing; acoustic time-frequency images; capture acoustic scene information; constant-Q transform; CQT; Feature extraction; feature extraction; fusion; LBP; local binary pattern variants; local binary patterns; Mel frequency cepstral coefficient; Q-factor; signal classification; Spectrogram; temporal features; time frequency analysis; time-frequency analysis; Time-frequency analysis; time-frequency representation; transforms; Transforms; variable-Q transform; VQT", } @Article{Ma:2018:RBL, author = "N. Ma and J. A. Gonzalez and G. J. 
Brown", title = "Robust Binaural Localization of a Target Sound Source by Combining Spectral Source Models and Deep Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2122--2131", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855960", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; Adaptation models; Auditory system; Azimuth; background model parameters; background source model; binaural sound localization; Binaural source localisation; biological spatial hearing; Biological system modeling; Computational modeling; deep neural networks; DNN-based localization system; feature extraction; hearing; localization process; machine hearing; machine hearing systems; masking; model adaptation process; model-based knowledge; neural nets; reverberation; robust binaural localization; room reverberation; sound localization performance; sound signals; sound source combination; source azimuth posteriors output; spectral analysis; spectral characteristics; spectral feature extraction; spectral source models; Speech processing; target sound source; target speech source; Time-frequency analysis", } @Article{Wu:2018:DDN, author = "S. Wu and D. Zhang and Z. Zhang and N. Yang and M. Li and M. 
Zhou", title = "Dependency-to-Dependency Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2132--2141", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2855968", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Computational modeling; Decoding; decoding; dependence parsing; dependence tree; encoder-decoder model; encoding; language translation; Magnetic heads; neural machine translation; NMT; novel sequence-to-dependence framework; Predictive models; recurrent neural nets; recurrent neural network; Recurrent neural networks; Syntactics; Syntax; syntax-aware encoder; target translation; Task analysis; translation quality; translation tasks; tree structure; trees (mathematics)", } @Article{Xu:2018:CDS, author = "J. Xu and H. He and X. Sun and X. Ren and S. 
Li", title = "Cross-Domain and Semisupervised Named Entity Recognition in {Chinese} Social Media: a Unified Model", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2142--2152", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2856625", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Chinese social media; Chinese social media language; cross-domain learning; domain similarity; in-domain supervised learning; in-domain unannotated information; in-domain unannotated text; Kernel; learning (artificial intelligence); massive unannotated text; Named entity recognition; natural language processing; out-of-domain corpora; Predictive models; semi-supervised learning; semisupervised learning; Semisupervised learning; semisupervised named entity recognition; Social network services; social networking (online); Speech processing; Task analysis; text analysis; Training", } @Article{VanKuyk:2018:EII, author = "S. {Van Kuyk} and W. B. Kleijn and R. C. 
Hendriks", title = "An Evaluation of Intrusive Instrumental Intelligibility Metrics", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2153--2166", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2856374", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "additive noise; Additive noise; CSII; Danish speech; Degradation; Distortion; Dutch speech; English speech; ESTOI; HASPI; HEGP; Indexes; instrumental measures; intelligibility data; Intelligibility prediction; intrusive instrumental intelligibility metrics; Measurement; MIKNN; monaural intrusive intelligibility metrics; NCM; QSTI; sEPSM; SIIB; SIMI; Speech enhancement; speech enhancement; speech intelligibility; statistical analysis; statistical dependencies; STOI", } @Article{Ouyang:2018:SPP, author = "X. Ouyang and K. Gu and P. 
Zhou", title = "Spatial Pyramid Pooling Mechanism in {3D} Convolutional Network for Sentence-Level Classification", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2167--2179", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2852502", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "3D CNN; 3D convolutional network; CNN; complicated internal relations; Computational modeling; convolution; convolutional neural network; Correlation; end-to-end language processing structure; Feature extraction; feature extraction; features extraction; feedforward neural nets; image processing; language processing; length sections; natural language processing; object detection; pattern classification; pooling processing; Recurrent neural networks; relation classification; Relation Classification; SemEval-2010 Task 8 dataset; Sentence Classification; sentence length variety; sentence-level classification; sentences vectors; spatial pyramid pooling mechanism; SPP; SPP structure; Task analysis; text analysis; textual data modeling; Three-dimensional displays; vectors", } @Article{McFee:2018:APO, author = "B. McFee and J. Salamon and J. P. 
Bello", title = "Adaptive Pooling Operators for Weakly Labeled Sound Event Detection", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2180--2193", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2858559", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "active sound sources; adaptive pooling operators; audio recording; audio recordings; audio signal processing; autopool; average-pooling; common pooling operators; convolutional neural networks; Data models; deep learning; dynamic annotations; Event detection; feedforward neural nets; human annotators; learning (artificial intelligence); machine learning; Machine learning; max-pooling; MIL problems; min-pooling; multiple instance learning; multiple instance learning problem; Predictive models; SED applications; SED methods; segment labeling; signal detection; Sound event detection; sound source; Standards; static prediction; strong annotations; supervised machine learning problem; Task analysis; temporally dynamic predictions; time-series label prediction; Training; training labels; weakly labeled sound event detection", } @Article{Barbancho:2018:DBA, author = "I. Barbancho and G. Tzanetakis and A. M. Barbancho and L. J. 
Tard{\'o}n", title = "Discrimination Between Ascending\slash Descending Pitch Arpeggios", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2194--2203", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2858538", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal analysis; acoustic signal processing; arpeggiated chord; ascending pitch arpeggios; audio signal processing; automatic music transcription; Automatic music transcription; cepstral analysis; classification; descending pitch arpeggios; expressiveness; feature extraction; features; Fisher linear discriminant classification scheme; high-pitched note; Instruments; Market research; Mel frequency cepstral coefficient; Mel-frequency cepstral coefficients; MFCC; music; Music; music information retrieval (MIR); musical instruments; pitch direction; playing technique; signal classification; Spectrogram; spectrogram; Speech processing; stroke and arpeggio analysis; support vector machines; SVM linear classification scheme; Task analysis", } @Article{Kim:2018:LSI, author = "Y. Kim and M. Kim and J. Goo and H. 
Kim", title = "Learning Self-Informed Feature Contribution for Deep Learning-Based Acoustic Modeling", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2204--2214", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2858923", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic model network; Acoustic modeling; acoustic signal processing; Acoustics; Artificial neural networks; auxiliary deep neural network; contribution gate outputs; deep learning; deep learning-based acoustic modeling; DNN; element-level discriminative contributions; FCN; feature contribution network; feature engineering approach; feature extraction; Feature extraction; gated features; Hidden Markov models; input feature contributions; learning (artificial intelligence); Logic gates; neural nets; regularization method; self-informed feature contribution learning; short-term memory-based AMNs; sigmoid-based contribution gates; speech recognition; Speech recognition; TED-LIUM release 1 corpus; Training", } @Article{Coteli:2018:MSS, author = "M. B. {\c{C}}{\"o}teli and O. Olgun and H. 
Hac{\i}habibo{\u{g}}lu", title = "Multiple Sound Source Localization With Steered Response Power Density and Hierarchical Grid Refinement", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2215--2229", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2858932", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic field; acoustic signal processing; array signal processing; associated signal-adaptive search method; compact spherical harmonic representation; Computational efficiency; direction-of-arrival estimation; Direction-of-arrival estimation; DOA estimation; Estimation; Harmonic analysis; hierarchical grid refinement; Microphone arrays; microphone arrays; multiple sound source localization; reverberation; rigid spherical microphone arrays; sound field analysis; Source localization; Speech processing; steered response power; steered response power density", } @Article{Bao:2018:QGD, author = "J. Bao and Y. Gong and N. Duan and M. Zhou and T. 
Zhao", title = "Question Generation With Doubly Adversarial Nets", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2230--2239", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2859777", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "adversarial procedures; artificial intelligence; Data models; DC-Dis; domain-classification discriminator; domain-general representations; DoubAN; doubly adversarial nets; doubly-adversarial net; Gallium nitride; generated questions; generated text-question pairs; Generators; Knowledge discovery; learning (artificial intelligence); natural language processing; neural networks; novel neural question generation approach; pattern classification; QA-Dis; Question generation; question generator; question-answering discriminator; sequence-to-sequence learning; source domains; source-domain labeled data; specific domain; target domain; target-domain unlabeled data; Task analysis; text analysis; Training; training data; Training data; unsupervised learning", } @Article{Bu:2018:DPF, author = "B. Bu and C. Bao and M. 
Jia", title = "Design of a Planar First-Order Loudspeaker Array for Global Active Noise Control", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2240--2250", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2852479", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; acoustic transducer arrays; Acoustics; active noise control; Active noise control; Attenuation; general first-order sources; general variable first-order responses; global active noise control; Harmonic analysis; Loudspeakers; loudspeakers; monopole component; noise abatement; Planar arrays; planar first-order loudspeaker array structure; planar loudspeaker array; planar loudspeaker arrays; primary noise field; sound field; sound reproduction; Speech processing; spherical harmonics; tangential dipole components; Three-dimensional displays; traditional spherical loudspeaker array", } @Article{Anonymous:2018:IATi, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2251--2252", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2880636", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
@Article{Anonymous:2018:ITMi, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "2253--2255", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2880638", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPr, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "C3--C3", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2880640", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:BPi, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "26", number = "11", pages = "C4--C4", month = nov, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2880642", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:FCj, author = "Anonymous", 
title = "Front Cover", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "C1--C1", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2880612", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPu, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "C2--C2", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2880683", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCk, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2251--2252", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2867353", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:TCEk, author = "Anonymous", title = "Table of Contents [Edics]", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = 
"2253--2254", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2867355", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2018:ISM, author = "X. Wang and Z. Tu and M. Zhang", title = "Incorporating Statistical Machine Translation Word Knowledge Into Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2255--2266", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2860287", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Chinese-to-English translation; Decoding; English-to-German translation tasks; hybrid translation; Knowledge engineering; language translation; Modeling; natural language processing; Neural machine translation; neural machine translation; neural nets; neural network; neural network based classifier; Neural networks; NMT decoder; NMT decoding information; NMT word generation probability; probability; SMT word knowledge; SMT word recommendations; Speech processing; statistical analysis; Statistical learning; statistical machine translation; Training; translation combination; vocabulary; Vocabulary", } @Article{Zhao:2018:SSS, author = "Y. Zhao and M. Kuruvilla-Dugdale and M. 
Song", title = "Structured Sparse Spectral Transforms and Structural Measures for Voice Conversion", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2267--2276", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2860682", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "12 speaker pairs; Distortion; Distortion measurement; frequency warping; frequency-warping characteristic; high-D data; high-dimensional STRAIGHT spectra; Matrices; matrix decomposition; muffled speech; NMF; nonnegative matrix factorization; objective measures; overfit matrix; ROS; source-target speaker pair; Sparse matrices; spectral distortion; Speech processing; speech processing; structural measures; structure preservation; structured sparse spectral transform; structured sparse spectral transforms; temporal covariance; Training; transform matrix; Transforms; VC method; VC speech quality; voice conversion; Voice conversion; voice similarity", } @Article{Salehi:2018:LBR, author = "H. Salehi and D. Suelzle and P. Folkeard and V. 
Parsa", title = "Learning-Based Reference-Free Speech Quality Measures for Hearing Aid Applications", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2277--2288", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2860786", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; aid applications; amalgamates perceptual linear prediction; Auditory system; Band-pass filters; feature extraction; Feature extraction; feature set; frequency-shaped reference signal; full-reference HASQI performance; gammatone filterbank energies; HA output; HA quality ratings; HA recordings; hearing; hearing aid speech quality index; hearing aids; Hearing aids; HL-impacted gammatone auditory filterbank energies; HL-modified PLP coefficients; IIR filters; learning (artificial intelligence); loss modeling; Machine learning; machine learning; machine learning concepts; medical signal processing; objective measures; perceptual linear prediction; predicted quality scores; properly time-aligned; Quality assessment; reference-free HA speech quality indices; reference-free quality assessment; reference-free speech quality; regression analysis; speech enhancement; speech intelligibility; speech processing; Speech processing; speech quality; Support vector machines; support vector machines; support vector regression", } @Article{Enzner:2018:BMF, author = "G. Enzner and P. 
Th{\"u}ne", title = "{Bayesian} {MMSE} Filtering of Noisy Speech by {SNR} Marginalization With Global {PSD} Priors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2289--2304", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2862641", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "a-posteriori SNR; additive noise; Bayes methods; Bayesian estimation; Bayesian MMSE filtering; complex speech spectral amplitudes; global distribution; global PSD priors; global SNR value; joint posterior distribution; latent speech power-spectral density; latent speech PSD state; latent time-varying a-priori SNR; latent Wiener filter; least mean squares methods; local data likelihood; MMSE estimation framework; Noise measurement; noisy speech; residual noise; Signal to noise ratio; single-channel speech enhancement; SNR marginalization; spectral analysis; speech enhancement; Speech enhancement; speech quality; speech-in-noise condition; speech-PSD posterior; stationary Wiener filters; statistical analysis; statistical estimators; Time-frequency analysis; Wiener filters", } @Article{Huang:2018:IFI, author = "G. Huang and J. Chen and J. 
Benesty", title = "Insights Into Frequency-Invariant Beamforming With Concentric Circular Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2305--2318", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2862826", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "array signal processing; Array signal processing; CCMA; circular microphone arrays; concentric circular microphone arrays; deep nulls problem; directivity factor; fixed and differential beamforming; frequency-invariant beamforming; frequency-invariant beampattern; Jacobi-Anger expansion; Jacobian matrices; Microphone arrays; microphone arrays; Nth-order symmetric beampatterns; Sensor arrays; Speech processing; white noise gain", } @Article{Ayana:2018:ZSC, author = "{Ayana} and S. Shen and Y. Chen and C. Yang and Z. Liu and M. 
Sun", title = "Zero-Shot Cross-Lingual Neural Headline Generation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2319--2327", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2842432", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "cross-lingual headline generation; Data models; direct source language articles; direct source-to-target CNHG model; English-Chinese headline generation evaluation datasets; headline generation; language translation; monolingual headline generation; natural language processing; Neural network; Neural networks; NHG systems; parameterized CNHG model; source document; Speech processing; summarization phases; target language headlines; text analysis; Training; Training data; zero-shot cross-lingual neural headline generation; zero-shot scenario", } @Article{Surendran:2018:OPC, author = "S. Surendran and T. K. 
Kumar", title = "Oblique Projection and Cepstral Subtraction in Signal Subspace Speech Enhancement for Colored Noise Reduction", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2328--2340", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2864535", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "additive noise subspace; cepstral domain; cepstral subtraction; clean speech signal; Colored noise; colored noise reduction; colored noise removal; Covariance matrices; Distortion; Masking property; matrix algebra; Noise measurement; noisy speech subspace; oblique projection; orthogonal noise subspace; residual noise; signal subspace approach; signal subspace speech enhancement; spectral domain constrained estimator; Speech enhancement; speech enhancement; speech enhancement methods; subspace speech enhancement method; variance normalization", } @Article{Li:2018:LKA, author = "Q. Li and D. F. Wong and L. S. Chao and M. Zhu and T. Xiao and J. Zhu and M. 
Zhang", title = "Linguistic Knowledge-Aware Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2341--2354", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2864648", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Attention gate; Decoding; Encoding; encoding; knowledge block; knowledge gate; knowledge-aware NMT approach; language translation; linguistic knowledge-aware neural machine translation; Linguistics; linguistics; natural language processing; neural machine translation (NMT); NMT encoder; recurrent neural nets; recurrent neural network; Recurrent neural networks; RNN encoder; Speech processing; syntactic information; Syntactics; word embeddings; word representation", } @Article{Zhang:2018:SNF, author = "W. Zhang and C. Hofmann and M. Buerger and T. D. Abhayapala and W. 
Kellermann", title = "Spatial Noise-Field Control With Online Secondary Path Modeling: a Wave-Domain Approach", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2355--2370", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2864577", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; active noise control; Active noise control; Active noise reduction; Adaptive algorithms; adaptive feedback control; adaptive processing; feedback; feedback system; least mean squares methods; loudspeakers; Loudspeakers; low-level auxiliary noise; microphone array placement; microphone arrays; Microphone arrays; multichannel active noise control; multichannel ANC; nonconcentric circular loudspeakers; online secondary path modeling; secondary path modelling; Sensors; spatial noise-field control; strong interchannel interference; tonal noise; Transforms; wave domain; wave-domain adaptation algorithm; wave-domain secondary path model", } @Article{Meynard:2018:SAN, author = "A. Meynard and B. 
Torr{\'e}sani", title = "Spectral Analysis for Nonstationary Audio", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2371--2380", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2862353", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Amplitude modulation; approximate maximum-likelihood approach; audio signal processing; deformation; Doppler effect; Gaussian processes; Gaussian stationary random signals; local spectrum; maximum likelihood estimation; nonstationary audio signals; Nonstationary signals; spectral analysis; Speech processing; stationarity-breaking operators; time warping; wavelet analysis; Wavelet analysis; wavelet transform domain; wavelet transforms; Wavelet transforms", } @Article{Martin-Morato:2018:AMT, author = "I. Mart{\'\i}n-Morat{\'o} and M. Cobos and F. J. 
Ferri", title = "Adaptive Mid-Term Representations for Robust Audio Event Classification", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2381--2392", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2865615", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic event detection; adaptive mid-term representations; alternative event representation; audio analysis tasks; Audio event classification; audio scene classification; audio signal processing; audio signals; distance-based texture windows; Event detection; event segmentation stage; feature extraction; Feature extraction; feature space; fixed-length feature vectors; fixed-length representation; Hidden Markov models; image classification; image segmentation; image texture; improved statistical description; low-level audio features; mid-term segments; mid-term statistics; nonlinear time normalization; robust audio event classification; robust mid-term statistical description; Robustness; sampling methods; short-term features; short-term temporal framing; Statistics; support vector machines; Support vector machines; temporal evolution; temporal information; temporal variability; trace-segmentation; uniform distance subsampling; variable length; vectors", } @Article{Firtha:2018:GRW, author = "G. Firtha and P. Fiala and F. Schultz and S. 
Spors", title = "On the General Relation of Wave Field Synthesis and Spectral Division Method for Linear Arrays", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2393--2403", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2865091", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic arrays; acoustic signal processing; appropriate boundary integral representation; arbitrary target sound field reproduction; arbitrary virtual sound field; densely spaced loudspeaker ensemble; explicit analytic method; explicit solution aims; extended listening area; Geometry; Green's function methods; high-frequency approximation; implicit analytic method; integral equation; Integral equations; integral equations; linear arrays; loudspeakers; Receivers; required loudspeaker driving functions; sound field synthesis; sound reproduction; spectral division method; spectral integral; Speech processing; target field specific synthesis scenarios; Three-dimensional displays; Two dimensional displays; Wave field synthesis; wave field synthesis", } @Article{Birkholz:2018:NIS, author = "P. Birkholz and S. Stone and K. Wolf and D. 
Plettemeier", title = "Non-Invasive Silent Phoneme Recognition Using Microwave Signals", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2404--2411", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2865609", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Antenna measurements; audible speech; electromagnetic transmission spectra; frequency 2.0 GHz to 12.0 GHz; k-nearest neighbors; linear discriminant analysis; microwave detectors; microwave signals; multiple phonetic contexts; nearest neighbour methods; noninvasive silent phoneme recognition; Radar antennas; Sensors; Silent-speech interface; silent-speech interfaces; silent-speech technology; Speech processing; Speech recognition; speech recognition; Speech synthesis; Vivaldi antennas", } @Article{Lin:2018:MVD, author = "W. Lin and M. Mak and J. 
Chien", title = "Multisource {I}-Vectors Domain Adaptation Using Maximum Mean Discrepancy Based Autoencoders", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2412--2422", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2866707", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Adaptation models; Covariance matrices; data distributions; domain adaptation; domain-invariant autoencoder; domainwise MMD; generalized MMD; i-vectors; i-vectors domain adaptation; learning (artificial intelligence); Machine learning; machine learning tasks; maximum mean discrepancy; maximum mean discrepancy based autoencoders; MMD-based autoencoders; multisource i-vector adaptation; multisource mismatch; NIST; probability distributions; Robustness; speaker recognition; Speaker verification; speaker verification systems; speech coding; Speech processing; statistical distributions; Training; Training data; vectors", } @Article{Abdelwahab:2018:DAA, author = "M. Abdelwahab and C. 
Busso", title = "Domain Adversarial for Acoustic Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2423--2435", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2867099", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic emotion recognition; acoustic signal processing; adversarial multitask training; adversarial training; data annotation; data distributions; Data models; data representations; deep neural network; domain adversarial; domain classifier; emotion recognition; Emotion recognition; emotion recognition performance; emotional classifiers; emotional dimensions; emotional-attribute-based descriptor prediction; gradient methods; gradient reversal layer; image classification; image representation; learning (artificial intelligence); neural nets; performance gap; shallow neural network; source domain; Speech emotion recognition; speech emotion recognition; Speech processing; speech recognition; Speech recognition; target domain representations; test domains; Testing; testing data; testing performance; Training; unlabeled adaptation of acoustic emotional models; unlabeled data", } @Article{ElBadawy:2018:DAO, author = "D. {El Badawy} and I. 
Dokmani{\'c}", title = "Direction of Arrival With One Microphone, a Few {LEGOs}, and Non-Negative Matrix Factorization", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2436--2446", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2867081", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; ad hoc scatterers; arbitrary scattering structure; direction of arrival estimation; direction-dependent way; direction-of-arrival estimation; Direction-of-arrival estimation; frequency response; group sparsity; inverse problem; inverse problems; learned nonnegative dictionaries; learning (artificial intelligence); LEGO bricks; localizing speech; matrix decomposition; Microphones; microphones; monaural localization; monaural speech localization algorithm; multisource localization; non-negative matrix factorization; nonnegative dictionaries; nonnegative matrix factorization; rudimentary structures; Scattering; single microphone; sound scattering; sound source localization; Speech processing; speech processing; unilateral hearing loss; universal speech model; white noise; White noise", } @Article{Lee:2018:ISC, author = "H. Lee and P. Chung and Y. Wu and T. Lin and T. 
Wen", title = "Interactive Spoken Content Retrieval by Deep Reinforcement Learning", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2447--2459", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2852739", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "content-based retrieval; deep reinforcement learning; deep-Q-learning; deep-Q-network; DQN; Feature extraction; hand-crafted states; interactive spoken content retrieval; interactive systems; Learning (artificial intelligence); learning (artificial intelligence); machine actions; Machine learning; Multimedia communication; reinforcement learning; Reinforcement learning; retrieval results; retrieved items; Speech processing; speech recognition; Speech recognition; Spoken content retrieval; text content retrieval; User interfaces; user-machine interaction", } @Article{Elshamy:2018:DSS, author = "S. Elshamy and N. Madhu and W. Tirry and T. 
Fingscheidt", title = "{DNN}-Supported Speech Enhancement With Cepstral Estimation of Both Excitation and Envelope", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2460--2474", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2867947", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "a priori SNR; a priori SNR estimation; CEM technique; Cepstral analysis; cepstral domain; cepstral excitation manipulation technique; classical MMSE short time spectral amplitude estimator; clean envelope-representing coefficients; clean spectral envelopes; Deep learning; deep neural network approach; DNN-supported speech enhancement; filtering theory; hidden Markov model; Hidden Markov models; hidden Markov models; human speech production; least mean squares methods; neural nets; noise attenuation; Noise reduction; noise reduction framework; noisy conditions; Signal to noise ratio; source-filter model; spectral analysis; speech component; Speech enhancement; speech enhancement; speech spectral envelope-based noise reduction", } @Article{Bao:2018:CCP, author = "Y. Bao and H. 
Chen", title = "A Chance-Constrained Programming Approach to the Design of Robust Broadband Beamformers With Microphone Mismatches", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2475--2488", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2868416", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "array response distortion distribution property; array signal processing; Broadband beamformers; Broadband communication; CCP-based design problem; chance constraint probability; chance-constrained programming; chance-constrained programming based design approach; chance-constrained stopband level constraint; computational complexity; convex programming; Distortion; Microphone arrays; microphone arrays; microphone mismatches; NP-hard problem; Optimization; overconservatism problem; Passband; probability; relaxed convex optimization formulation; robust broadband beamformers; robustness; Robustness; WMPO-based design approaches; worst case mean performance optimization; worst-case mean performance optimization", } @Article{Anonymous:2018:FE, author = "Anonymous", title = "Farewell Editorial", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2489--2489", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2879265", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:LR, author = "Anonymous", title = "List of Reviewers", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2490--2496", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2879695", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "IEEE publishing", } @Article{Anonymous:2018:IATj, author = "Anonymous", title = "{{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Edics", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2497--2498", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2880644", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ITMj, author = "Anonymous", title = "{{\booktitle{IEEE Transactions on Multimedia}}} information for authors", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2499--2501", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2880646", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language 
Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:IOA, author = "Anonymous", title = "{IEEE} Open Access Publishing", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2502--2502", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2882333", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:IIA, author = "Anonymous", title = "2018 Index {{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}} Vol. 26", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "2503--2528", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2880685", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:ISPv, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "C3--C3", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2880648", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and 
Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2018:BPj, author = "Anonymous", title = "Blank page", journal = j-IEEE-ACM-TASLP, volume = "26", number = "12", pages = "C4--C4", month = dec, year = "2018", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2880650", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:TCa, author = "Anonymous", title = "Table of contents", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "C1--1", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2883927", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:ISPa, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "C2--C2", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2883931", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:TCEa, author = "Anonymous", title = "Table of Contents [Edics]", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "2--3", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2883929", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:BP, author = "Anonymous", title = "[{Blank} page]", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "B4--B4", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2885939", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:IEI, author = "Anonymous", title = "Inaugural Editorial Innovations in an Era of Ubiquitous Audio, Speech, and Language Processing", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "5--6", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2884853", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bao:2019:NRM, author = "F. Bao and W. H. Abdulla", title = "A New Ratio Mask Representation for {CASA}-Based Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "7--19", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2868407", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "binary mask; CASA-based speech enhancement; channel bank filters; channel-weight contour; Computational auditory scene analysis (CASA); Correlation; deep neural networks (DNN); equal loudness hearing attribute; five-layer structured deep neural network; Gammatone filterbank channel; hearing; ICC; ideal ratio mask (IRM); inter-channel correlation; neural nets; Noise measurement; noise ratio conditions; ratio mask; ratio mask representation; revised ratio mask; Signal to noise ratio; source separation; spectral distortion; speech enhancement; Speech enhancement; speech processing; speech quality; speech-noise power ratio; Standards; Training; Wiener filtering; Wiener filters", } @Article{Magron:2019:CIP, author = "P. Magron and T. 
Virtanen", title = "Complex {ISNMF}: a Phase-Aware Model for Monaural Audio Source Separation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "20--31", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2869684", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Adaptation models; anisotropic Gaussian model; audio signal processing; audio source separation; Bayes methods; Bayesian anisotropic Gaussian source model; Bayesian inference; circularly-symmetric Gaussian; complex ISNMF; complex Itakura-Saito NMF; complex NMF; Estimation; expectation-maximisation algorithm; Fourier transforms; Gaussian distribution; Gaussian processes; Itakura Saito divergence; Markov chain prior structure; matrix decomposition; monaural audio source separation; musical source separation task; nonisotropic variables; nonnegative matrix factorization; Nonnegative matrix factorization (NMF); phase constraints; phase recovery; phase-aware model; phase-aware probabilistic model; probability; Random variables; short-time Fourier transform domain; signal model; source separation; Source separation; Speech processing; state-of-the-art phase-aware separation techniques", } @Article{Duong:2019:GMB, author = "T. T. H. Duong and N. Q. K. Duong and P. C. Nguyen and C. Q. 
Nguyen", title = "{Gaussian} Modeling-Based Multichannel Audio Source Separation Exploiting Generic Source Spectral Model", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "32--43", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2869692", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "audio signal processing; blind audio source separation; blind source separation; covariance analysis; Covariance matrices; Electronic mail; expectation-maximisation algorithm; Frequency-domain analysis; Gaussian modeling-based multichannel audio source Separation; Gaussian processes; generalized expectation-minimization algorithm; generic source spectral model; generic spectral model; group sparsity constraint; intermediate source variances; local Gaussian model; matrix decomposition; Microphones; Multichannel audio source separation; multichannel source separation approach; NMF; nonnegative matrix factorization; Parameter estimation; parameter estimation; signal denoising; single-channel audio mixtures; Source separation; source spatial covariance model; source variance denoising; Speech processing; speech processing; unified Gaussian modeling framework", } @Article{Zhang:2019:DTC, author = "G. Zhang and J. Tao and X. Qiu and I. 
Burnett", title = "Decentralized Two-Channel Active Noise Control for Single Frequency by Shaping Matrix Eigenvalues", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "44--52", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2869686", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "active noise control; Active noise control (ANC); active noise control system; adaptive controller; centralized approaches; centralized controller; Computational complexity; computational complexity; Convergence; Decentralized control; decentralized control scheme; decentralized controller; decentralized two-channel active noise control; Eigenvalues and eigenfunctions; eigenvalues and eigenfunctions; error microphone; error microphones; frequency domain; matrix algebra; matrix eigenvalues; Microphones; microphones; multiple secondary sources; noise disturbance; Noise reduction; noise reduction performance; Process control; small-size ANC subsystems; two-channel ANC system; two-channel secondary paths", } @Article{Zhao:2019:TSD, author = "Y. Zhao and Z. Wang and D. 
Wang", title = "Two-Stage Deep Learning for Noisy-Reverberant Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "53--62", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2870725", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "automatic speech; background noise; deep neural networks; Deep neural networks; denoising; dereverberation; ideal ratio mask; iterative methods; iterative phase reconstruction; learning (artificial intelligence); Linear programming; neural nets; Noise measurement; Noise reduction; noisy-reverberant speech enhancement; objective function; one-stage enhancement systems; phase; phase estimates; reverberation; Reverberation; room reverberation; signal reconstruction; speaker recognition; spectral magnitudes estimation; speech denoising; speech dereverberation; Speech enhancement; speech enhancement; speech intelligibility; speech quality; Time-domain analysis; Training; two-stage deep learning; two-stage model", } @Article{Zheng:2019:PAS, author = "N. Zheng and X. 
Zhang", title = "Phase-Aware Speech Enhancement Based on Deep Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "63--76", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2870742", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "corresponding magnitude spectrogram; Deep neural network (DNN); deep neural networks; DNN-based methods; Fourier transforms; harmonic model; incorporating phase; instantaneous frequency; instantaneous frequency deviation; learning (artificial intelligence); neural nets; Noise measurement; phase estimation; phase processing; phase-aware speech enhancement algorithm; radio applications; short-time frequency; Spectrogram; speech enhancement; Speech enhancement; speech recognition; speech-processing algorithms; STFT magnitude; telecommunication; Time-frequency analysis; time-frequency analysis; Training; unstructured phase spectrogram; unstructured STFT phase; Wrapping", } @Article{Moriya:2019:ESB, author = "T. Moriya and T. Tanaka and T. Shinozaki and S. Watanabe and K.
Duh", title = "Evolution-Strategy-Based Automation of System Development for High-Performance Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "77--88", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2871755", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "cloud computers; cloud computing; covariance matrix adaptation evolution strategy (CMA-ES); deep neural network; deep neural network (DNN); evolution-strategy-based automation; evolutionary computation; genetic algorithm; Genetic algorithms; hidden Markov model; hidden Markov models; Hidden Markov models; high-performance speech recognition; large vocabulary speech recognition system; meta-parameters; multi-objective optimization; multiobjective Pareto optimization; neural nets; Optimization; parallel computation; parallel processing; Pareto optimisation; Speech processing; Speech recognition; speech recognition; system development; Training; Vocabulary; word error rate", } @Article{Kamper:2019:SSR, author = "H. Kamper and G. Shakhnarovich and K. 
Livescu", title = "Semantic Speech Retrieval With a Visually Grounded Model of Untranscribed Speech", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "89--98", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2872106", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Analytical models; automatic speech recognition; Data models; external image tagger; human semantic relevance judgements; information retrieval; keyword spotting; learning (artificial intelligence); multimodal modelling; natural language processing; neural model; neural nets; nonverbatim semantic matches; parallel speech; Predictive models; semantic retrieval; semantic speech retrieval; Semantics; speech processing; Speech processing; speech recognition; speech retrieval; Task analysis; unlabelled speech; untranscribed speech; visual context; Visual grounding; Visualization; visually grounded speech model", } @Article{Kavalekalam:2019:MBS, author = "M. S. Kavalekalam and J. K. Nielsen and J. B. Boldt and M. G. 
Christensen", title = "Model-Based Speech Enhancement for Intelligibility Improvement in Binaural Hearing Aids", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "99--113", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2872128", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic scenarios representative; acoustic signal processing; autoregressive model; binaural codebook-based method; binaural enhancement; binaural hearing aids; binaural speech enhancement framework; clean speech pitch parameters; cocktail party scenario; directional pitch estimator; Ear; enhancement process; Estimation; filter parameters; harmonic model; hearing aid technology; hearing aids; hearing impaired individuals; intelligibility improvement; Kalman filter; Kalman filters; Mathematical model; maximum likelihood estimation; maximum likelihood principle; model-based speech enhancement; Noise measurement; normal hearing subjects; pitch estimation; pitch parameters; robust estimation; Speech enhancement; speech enhancement; speech intelligibility; speech production dynamics; speech production model; speech quality; STP parameters", } @Article{R:2019:GIF, author = "A. R. MV and P. K. 
Ghosh", title = "Glottal Inverse Filtering Using Probabilistic Weighted Linear Prediction", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "114--124", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2873897", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "all-pole filter; Computational modeling; Data models; filter coefficients; filtering theory; Gibbs sampling; GIF; glottal closure; glottal cycle; glottal flow estimate; glottal inverse filtering; Glottal inverse filtering; Indexes; Liljencrants-Fant model; Lips; physical model; probabilistic interpretation; Probabilistic logic; probabilistic temporal weighting; probabilistic weighted linear prediction; probability; Random variables; speech data; speech processing; Speech processing; synthetic data", } @Article{Sun:2019:TSM, author = "Y. Sun and W. Wang and J. Chambers and S. M.
Naqvi", title = "Two-Stage Monaural Source Separation in Reverberant Room Environments Using Deep Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "125--139", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2874708", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; current state-of-the-art methods; deep neural networks; Deep neural networks; dereverberant speech mixture; dereverberation mask; DM; DNN-based method; highly reverberant room environments; ideal enhanced mask; ideal ratio mask; IEM; Interference; IRM; monaural source separation; monaural source separation problem; neural nets; Neural networks; Noise measurement; NOISEX dataset; reverberant room environments; reverberation; Reverberation; room impulse responses; single DNN; source separation; Source separation; speech intelligibility; speech mixture dereverberation; speech processing; Speech processing; TIMIT corpora; Training; transient response; two-stage approach; two-stage monaural source separation", } @Article{Ferrer:2019:TFS, author = "L. Ferrer and M. K. Nandwana and M. McLaren and D. Castan and A. 
Lawson", title = "Toward Fail-Safe Speaker Recognition: Trial-Based Calibration With a Reject Option", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "140--153", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2875794", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Bayes methods; calibration; Calibration; calibration loss; calibration step; candidate training; Computational modeling; Data models; evaluation conditions; forensic voice comparison; Forensics; Gaussian processes; learning (artificial intelligence); Logistics; matched calibration data; matched data; reject option; relevant calibration data; separate calibration model; Speaker recognition; speaker recognition; speaker recognition systems; standard calibration approach; TBC method; toward fail-safe speaker recognition; Training; training data; trial-based calibration", } @Article{Amini:2019:ACR, author = "J. Amini and R. C. Hendriks and R. Heusdens and M. Guo and J. 
Jensen", title = "Asymmetric Coding for Rate-Constrained Noise Reduction in Binaural Hearing Aids", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "154--167", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2876172", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "advanced noise reduction algorithms; Array signal processing; asymmetric coding; asymmetric sequential coding scheme; binaural hearing aids; Binaural hearing aids (HAs); complete joint noisy signal statistics; hearing aids; information bit-rate; mean square error distortion measure; mean square error methods; medical signal processing; microphones; Microphones; monaural beamforming; monaural-bilateral HA; multi-microphone noise reduction; Noise measurement; Noise reduction; optimal rate-constrained beamforming strategy; Quantization (signal); rate-constrained noise reduction; remote source coding; sequential codes; signal denoising; Source coding; speech coding; sub-optimal rate; sub-optimal strategies; transmission capacities", } @Article{Yu:2019:GIA, author = "J. Yu and J. Jiang and R. 
Xia", title = "Global Inference for Aspect and Opinion Terms Co-Extraction Based on Multi-Task Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "168--177", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2875170", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "aspect term extraction; aspect terms; Benchmark testing; data mining; global inference approach; global inference method; inference mechanisms; inter-task relationship; Labeling; learning (artificial intelligence); multitask learning framework; multitask neural networks; Natural language processing; neural nets; neural network architectures; Neural networks; neural networks; neural predictions; opinion mining; opinion term extraction; opinion terms co-extraction; Sentiment analysis; sentiment analysis; Standards; syntactic constraints; syntactic relations; Syntactics; Task analysis", } @Article{Wang:2019:RSL, author = "Z. Wang and X. Zhang and D. 
Wang", title = "Robust Speaker Localization Guided by Deep Learning-Based Time-Frequency Masking", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "178--188", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2876169", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic noise; acoustic signal processing; audio signal processing; conventional localization algorithms; deep learning-based time-frequency masking; deep neural networks; Delay effects; direction of arrival estimation; Direction-of-arrival estimation; direction-of-arrival estimation; Estimation; GCC-PHAT; generalized cross correlation; ideal ratio mask; intense noise; learning (artificial intelligence); Microphones; microphones; monaural spectral information; monaural speech enhancement; monaural speech separation; neural nets; noisy environments; reverberant environments; Reverberation; robust speaker localization; room reverberation; Signal processing algorithms; Signal to noise ratio; single-channel; speech dominant T-F units; speech processing; steered-response power; steering vectors; time-frequency analysis; time-frequency masking; traditional DOA estimation methods; trained model", } @Article{Tan:2019:GRN, author = "K. Tan and J. Chen and D. 
Wang", title = "Gated Residual Networks With Dilated Convolutions for Monaural Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "189--198", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2876171", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "bidirectional LSTM model; CNN model; contextual information; Convolution; convolutional neural network architecture; deep neural networks; dilated convolutions; Dilated convolutions; feedforward neural nets; gated linear units; gated residual networks; gating mechanisms; generalisation (artificial intelligence); learning (artificial intelligence); Logic gates; long-term contexts; mask estimation; monaural speech enhancement; Noise measurement; objective speech intelligibility; quality metrics; recurrent neural nets; residual learning; sequence-to-sequence mapping; Signal to noise ratio; spectral mapping; speech enhancement; Speech enhancement; speech intelligibility; supervised speech enhancement; systematic context aggregation; target speaker tracking; temporal contexts; Training; unidirectional long short-term memory; unidirectional LSTM model", } @Article{Ngo:2019:PAS, author = "G. H. Ngo and M. Nguyen and N. F.
Chen", title = "Phonology-Augmented Statistical Framework for Machine Transliteration Using Limited Linguistic Resources", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "199--211", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2875269", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "consonant cluster; cross-lingual information retrieval; Data models; foreign word; language translation; linguistic resources; linguistics; machine translation; machine transliteration; named entity recognition; natural language processing; Phonetics; phonological structure; phonology-augmented statistical framework; source language; Speech processing; Standards; statistical analysis; statistical transliteration approaches; target languages phonology; Task analysis; Training; Training data; Transliteration; transliteration system", } @Article{Koizumi:2019:UDA, author = "Y. Koizumi and S. Saito and H. Uematsu and Y. Kawachi and N. 
Harada", title = "Unsupervised Detection of Anomalous Sound Based on Deep Learning and the {Neyman--Pearson} Lemma", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "212--224", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2877258", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal detection; autoencoder; anomalous sound; Anomaly detection in sound; anomaly score; deep learning; Feature extraction; learning (artificial intelligence); Linear programming; Neyman-Pearson lemma; optimisation; Probability density function; reconstruction error; sampling methods; security of data; simulate anomalous sounds; Speech processing; statistical analysis; Task analysis; Training data; true positive rate; unknown anomalous sounds; unsupervised anomaly detection; unsupervised detection; unsupervised learning; unsupervised-ADS", } @Article{Laufer:2019:BHM, author = "Y. Laufer and S.
Gannot", title = "A {Bayesian} Hierarchical Model for Speech Enhancement With Time-Varying Audio Channel", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "225--239", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2876177", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic channel; Acoustics; Adaptive beamforming; array signal processing; audio signal processing; Bayes methods; Bayesian hierarchical model; channel alignment; channel estimate; Covariance matrices; expectation-maximisation algorithm; filtering theory; fully Bayesian hierarchical approach; Gaussian processes; Heuristic algorithms; Kalman filters; Kalman smoother; Microphones; multichannel linear-Gaussian state-space model; multichannel minimum variance distortionless response beamformer; multichannel speech enhancement; multichannel Wiener filter; MVDR beamformer; noise precision matrix; noisy signal; probabilistic approach; probability; reverberation; reverberation levels; single-channel variational postfilter; Speech enhancement; speech enhancement; speech precision; speech quality; speech signal; time-varying audio channel; tracking ability; variational EM; variational expectation-maximization algorithm; VEM speech estimator; Wiener filters", } @Article{Anonymous:2019:ENA, author = "Anonymous", title = "Erratum for Nonlinear Audio Systems Identification Through Audio Input {Gaussianization}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "240--240", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2875325", ISSN = "2329-9290", ISSN-L = "2329-9290", 
bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Audio systems; Nonlinear systems; Speech processing", } @Article{Anonymous:2019:ISPb, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "1", pages = "C3--C3", month = jan, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2887012", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:TCb, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "27", number = "2", pages = "C1--241", month = feb, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2883933", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:ISPc, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "2", pages = "C2--C2", month = feb, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2883937", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 
09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:TCc, author = "Anonymous", title = "Table of {Contents[Edics]}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "2", pages = "242--243", month = feb, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2883935", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nakashika:2019:CVR, author = "T. Nakashika and S. Takaki and J. 
Yamagishi", title = "Complex-Valued Restricted {Boltzmann} Machine for Speaker-Dependent Speech Parameterization From Complex Spectra", journal = j-IEEE-ACM-TASLP, volume = "27", number = "2", pages = "244--254", month = feb, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2877465", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Boltzmann machines; cepstral analysis; complex-valued data; complex-valued representation; complex-valued restricted Boltzmann machine; complex-valued spectra; contrastive divergence; CRBM; deep learning; Feature extraction; feature extraction; Gibbs sampling; hidden Markov models; learning (artificial intelligence); Mel frequency cepstral coefficient; Restricted Boltzmann machine; signal classification; speaker-dependent speech parameterization; speech processing; Speech processing; Speech recognition; speech recognition; speech signal processing; speech synthesis; Task analysis", } @Article{Xiong:2019:JER, author = "F. Xiong and S. Goetze and B. Kollmeier and B. T. 
Meyer", title = "Joint Estimation of Reverberation Time and Early-To-Late Reverberation Ratio From Single-Channel Speech Signals", journal = j-IEEE-ACM-TASLP, volume = "27", number = "2", pages = "255--267", month = feb, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2877894", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic characterization; acoustic observations; acoustic room environment characterization; acoustic signal processing; architectural acoustics; artificial neural network; auditory-inspired acoustic features; blind estimation methods; early-to-late reverberation ratio; ELR classes; ELR estimation; ELR simultaneously; Estimation; extreme reverberant conditions; Feature extraction; joint estimation; joint room parameter estimator; learning (artificial intelligence); Modulation; multi-task learning; multitask learning; neural nets; noisy environments; parameter estimation; Reverberation; reverberation; Reverberation time; reverberation time; signal representation; single-channel speech signals; single-task ROPE system; speech processing; Speech processing; speech time-frequency representations; statistical distributions; sub-band frequency data; subband signals; temporal modulation features; temporal modulation filtering; Time-frequency analysis", } @Article{Stoter:2019:CEN, author = "F. St{\"o}ter and S. Chakrabarty and B. Edler and E. A. P. 
Habets", title = "{CountNet}: Estimating the Number of Concurrent Speakers Using Supervised Learning", journal = j-IEEE-ACM-TASLP, volume = "27", number = "2", pages = "268--282", month = feb, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2877892", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "audio surveillance; audio-based tasks; blind source separation; cocktail-party; complementary aspects; concurrent speakers; convolutional recurrent neural networks; deep architectures; deep neural network architectures; discrete point estimates; Estimation; learning (artificial intelligence); maximum number; Microphones; Neural networks; number of concurrent speakers; output posterior distributions; overlap detection; probability; recurrent neural nets; single-channel mixtures; Speaker count estimation; speaker count estimation; speaker diarization; speech mixtures; speech processing; Speech processing; supervised learning; Surveillance; Task analysis; unifying probabilistic paradigm", } @Article{Kolbaek:2019:RBS, author = "M. Kolb{\ae}k and Z. Tan and J. 
Jensen", title = "On the Relationship Between Short-Time Objective Intelligibility and Short-Time Spectral-Amplitude Mean-Square Error for Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "27", number = "2", pages = "283--295", month = feb, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2018.2877909", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Auditory system; Correlation; correlation theory; deep neural network based speech enhancement algorithms; deep neural networks; DNN training criterion; DNN-based speech enhancement algorithms; envelope linear correlation; improved speech intelligibility performance; least mean squares methods; mean-square error criterion; minimum mean-square error estimator; neural nets; Noise measurement; noisy speech; short-time objective intelligibility; short-time spectral amplitudes; short-time spectral-amplitude; Signal processing algorithms; Speech enhancement; speech enhancement; speech intelligibility; speech temporal envelopes; standard STSA minimum-MSE estimator; state-of-the-art speech intelligibility estimator; STOI speech intelligibility estimator; STSA-MSE criterion; Time-frequency analysis", } @Article{Hansen:2019:EFF, author = "M. W. Hansen and J. R. Jensen and M. G.
Christensen",
  title =        "Estimation of Fundamental Frequencies in Stereophonic
                 Music Mixtures",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "296--310",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2878384",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic signal processing; audio signal processing;
                 Delays; Estimation; expectation-maximisation
                 algorithm; Frequency estimation; fundamental frequency
                 estimation; Gaussian sources; harmonic amplitude
                 vectors; Harmonic analysis; harmonic mixture
                 components; instrument recordings; Instruments; least
                 squares approximations; mixing parameters; model
                 selection; multi-channel pitch estimation; Multi-pitch
                 estimation; multipitch estimation problem; Multiple
                 signal classification; music; music information
                 retrieval; overlapping harmonics; panning parameters;
                 pitch estimation problem; recording studio; signal
                 model; Speech processing; stereophonic music mixtures;
                 stereophonic signal analysis; vector quantization",
}

@Article{Bao:2019:TGT,
  author =       "J. Bao and D. Tang and N. Duan and Z. Yan and M. Zhou
                 and T.
Zhao",
  title =        "Text Generation From Tables",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "311--320",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2878381",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "artificial intelligence; BLEU-4 scores; continuous
                 vectors; Decoding; descriptive sentences;
                 Encyclopedias; flexible copying mechanism; language
                 model based approaches; natural language processing;
                 natural language sentence; Natural languages; neural
                 generative model; neural nets; neural network; Neural
                 networks; search engine; Search engines; selective
                 content replication; SIMPLEQUESTIONS dataset; Speech
                 processing; table attributes; table caption; table
                 cells; table semantics; table-query pairs;
                 Table-to-text generation; Table2Seq; Table2Seq model;
                 Task analysis; text analysis; text generation; WIKIBIO
                 dataset; WIKITABLETEXT dataset",
}

@Article{Koutrouvelis:2019:CAR,
  author =       "A. I. Koutrouvelis and R. C. Hendriks and R. Heusdens
                 and J.
Jensen",
  title =        "A Convex Approximation of the Relaxed Binaural
                 Beamforming Optimization Problem",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "321--331",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2878618",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Acoustic distortion; acoustic signal processing;
                 acoustic sources; approximation theory; Array signal
                 processing; array signal processing; Binaural
                 beamforming; binaural cues; binaural-cue distortions;
                 binaural-cue preservation; computational complexity;
                 concave programming; convex approximation; Convex
                 functions; convex optimization; convex programming;
                 distortion; frequency bin; hybrid methods; LCMV; lower
                 computational complexity; multiple convex optimization
                 problems; Noise reduction; noise reduction; noise
                 suppression; nonconvex optimization problem;
                 Optimization; output noise power; predicted
                 intelligibility; RBB optimization problem; RBB
                 problem; relaxed binaural beamforming optimization
                 problem; SCO method; semi-definite relaxation;
                 semidefinite convex relaxation; single convex
                 optimization problem; suboptimal hybrid method;
                 suboptimal method; suboptimal SDCR method; successive
                 convex optimization method; Wiener filters",
}

@Article{Hashimoto:2019:MMC,
  author =       "T. Hashimoto and D. Saito and N.
Minematsu",
  title =        "Many-to-Many and Completely Parallel-Data-Free Voice
                 Conversion Based on Eigenspace {DNN}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "332--341",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2878949",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Adaptation models; conversion model; Data models; deep
                 neural network; eigenspace DNN; eigenvalues and
                 eigenfunctions; eigenvoice; eigenvoice Gaussian
                 mixture models; Gaussian mixture model; Gaussian
                 mixture models; Gaussian processes; many-to-many
                 conversion; many-to-many voice conversion; mixture
                 models; neural nets; parallel processing;
                 parallel-data-free; parallel-data-free voice
                 conversion; prestored parallel data; pseudoparallel
                 data; speaker features; speaker recognition; speaker
                 space; Speech processing; Task analysis; Training;
                 Voice conversion; voice conversion models",
}

@Article{Pishdadian:2019:MRC,
  author =       "F. Pishdadian and B.
Pardo",
  title =        "Multi-Resolution Common Fate Transform",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "342--354",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2878616",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "audio signal processing; audio signal representation;
                 Audio source separation; audio sources; CFT; channel
                 bank filters; clusterability; fully invertible complex
                 time-frequency representation; high time-frequency
                 overlap; MCFT domain yield; Microsoft Windows;
                 Modulation; multi-resolution common fate transform;
                 multiple audio signals; multiresolution common fate
                 transform; multiresolution property; multiresolution
                 two-dimensional filter bank; resolution issue;
                 separability; signal representation; signal
                 resolution; source separation; Source separation;
                 source signals; state-of-the-art representation;
                 Time-frequency analysis; time-frequency analysis;
                 time-frequency domain; time-frequency signal
                 representations; Transforms; Two dimensional
                 displays",
}

@Article{Wu:2019:AAC,
  author =       "Y. Wu and W.
Li",
  title =        "Automatic Audio Chord Recognition With {MIDI}-Trained
                 Deep Feature and {BLSTM-CRF} Sequence Decoding Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "355--366",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2879399",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic signal processing; audio signal processing;
                 automatic audio chord recognition; Automatic chord
                 recognition; automatic chord recognition tasks;
                 bidirectional long short-term memory (BLSTM);
                 bidirectional long short-term memory conditional
                 random field; BLSTM-CRF sequence decoding model; chord
                 classification; chord recognition systems; CNN feature
                 extractor; conditional random fields (CRF);
                 convolution; convolutional neural network; data-driven
                 feature extraction; Decoding; deep feature extractor;
                 feature extraction; Feature extraction; feedforward
                 neural nets; hand-annotating time-synchronized chord
                 labels; Harmonic analysis; Hidden Markov models;
                 learning (artificial intelligence); machine learning
                 technologies; MIDI-trained deep feature; Music; music;
                 musical instrument digital interface; random
                 processes; real-world music audio recordings;
                 recurrent neural nets; signal classification;
                 Training",
}

@Article{Imoto:2019:ATM,
  author =       "K. Imoto and N.
Ono",
  title =        "Acoustic Topic Model for Scene Analysis With
                 Intermittently Missing Observations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "367--382",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2879855",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic observations; acoustic scene analysis;
                 Acoustic scene analysis; acoustic scenes; acoustic
                 signal processing; acoustic topic model; acoustic word
                 corresponds; acoustic word transition; Acoustics;
                 Analytical models; Data models; hidden Markov models;
                 Hidden Markov models; Image analysis; Markov model;
                 missing data analysis; missing observations; multiple
                 acoustic words; Privacy; Speech processing",
}

@Article{Xiao:2019:RME,
  author =       "K. Xiao and S. Wang and M. Wan and L.
Wu",
  title =        "Reconstruction of {Mandarin} Electrolaryngeal
                 Fricatives With Hybrid Noise Source",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "383--391",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2880607",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "abnormal source location; Acoustic analysis; acoustic
                 signal processing; Acoustics; Attenuation; Cutoff
                 frequency; EL fricative reconstruction; EL source; EL
                 speech production; electrolarynx; fricative
                 reconstruction; hybrid noise source; intelligibility;
                 Mandarin electrolaryngeal fricatives; Mandarin
                 electrolaryngeal speech; Mandarin fricatives; Position
                 measurement; Production; signal denoising; signal
                 reconstruction; speech enhancement; speech
                 intelligibility; Speech processing; transfer
                 functions; voice source; Wideband; wideband noise
                 source",
}

@Article{Krishnan:2019:FAA,
  author =       "L. Krishnan and T. Betlehem and P. D.
Teal",
  title =        "Fast Algorithms for Acoustic Impulse Response
                 Shaping",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "392--403",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2880317",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic impulse response shaping; acoustic signal
                 processing; Convergence; Dual Augmented Lagrangian
                 Method (DALM); fast algorithms; Fenchel conjugate;
                 Fenchel duality theorem; filtering theory; impulse
                 response shaping; Loudspeakers; Microphones;
                 microphones; Minimization; Reverberation;
                 reverberation; room acoustics; room compensation;
                 shaping algorithm; shaping filters; soft thresholding
                 function; Speech processing; transient response",
}

@Article{Zakeri:2019:AIH,
  author =       "V. Zakeri and A. J.
Hodgson",
  title =        "Automatic Identification of Hard and Soft Bone Tissues
                 by Analyzing Drilling Sounds",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "404--414",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2880336",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "biomedical ultrasonics; bone; bone drilling;
                 bone-drilling procedures; bone-out; bone-specific;
                 Bones; bovine tibial bones; Drilling machines;
                 drilling sound; Force; hard bone tissues; hidden
                 Markov model; hidden Markov models; logistic
                 regression; machine learning; Medical acoustics;
                 medical signal processing; random forest; regression
                 analysis; soft bone tissues; sound signals; Speech
                 processing; support vector machine; support vector
                 machines; Support vector machines; Surgery; surgery;
                 surgical drill; tissue identification; Tools; wavelet
                 packet transform coefficients; wavelet transforms",
}

@Article{Bilbao:2019:DSW,
  author =       "S. Bilbao and B.
Hamilton",
  title =        "Directional Sources in Wave-Based Acoustic
                 Simulation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "415--428",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2881336",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Acoustics; approximants; approximation theory;
                 arbitrary directivity; complete solution; detailed
                 modeling; directional character; directional sources;
                 finite difference time domain method; finite
                 difference time domain setting; finite difference
                 time-domain analysis; interpolation; Mathematical
                 model; multipole modeling; Numerical models; point
                 sources; Propagation; Room acoustics; Solid modeling;
                 source modeling; spatial Fourier-based approximation
                 strategy; spatial grid; spatio-temporal domain;
                 Three-dimensional displays; three-dimensional wave
                 equation; Time-domain analysis; underlying grid;
                 volumetric wave-based acoustic simulation; wave
                 equations",
}

@Article{Zhang:2019:SSC,
  author =       "Y. Zhang and B. Pardo and Z.
Duan",
  title =        "{Siamese} Style Convolutional Neural Networks for
                 Sound Search by Vocal Imitation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "429--441",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2868428",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "audio content; audio feature representations; audio
                 signal processing; convolution; Convolutional neural
                 networks; Databases; encoded features; environmental
                 sound classification; Feature extraction; feature
                 extraction; feedforward neural nets; fully connected
                 network; IMINET; imitation encoder; information
                 retrieval; learning (artificial intelligence); metric
                 learning; Neurons; original sound encoder; Poles and
                 towers; query processing; Siamese style convolutional
                 neural networks; similarity measures; sound search;
                 Speech processing; spoken language recognition; Task
                 analysis; TL-IMINET; transfer learning; unified
                 end-to-end training framework; vocal imitation; Vocal
                 imitation",
}

@Article{Feng:2019:URB,
  author =       "F. Feng and M.
Kowalski",
  title =        "Underdetermined Reverberant Blind Source Separation:
                 Sparse Approaches for Multiplicative and Convolutive
                 Narrowband Approximation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "442--456",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2881925",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Approximation algorithms; approximation theory; blind
                 source separation; Blind source separation;
                 convergence of numerical methods; convergence proof;
                 convolution; convolutive narrowband approximation;
                 Covariance matrices; expectation-maximisation
                 algorithm; Fourier transforms; live recorded mixtures;
                 Manganese; multiplicative narrowband approximation;
                 Narrowband; optimisation; Optimization; optimization
                 framework; optimization problems; reverberant
                 mixtures; reverberation; room impulse response;
                 separation problem; short-time-Fourier-transform;
                 signal representation; sparse component analysis;
                 sparse source signal representation; synthesized
                 recorded mixtures; Time-frequency analysis;
                 time-frequency domain; underdetermined convolutive
                 mixtures; underdetermined reverberant blind source
                 separation",
}

@Article{Wang:2019:CSS,
  author =       "Z. Wang and D.
Wang",
  title =        "Combining Spectral and Spatial Features for Deep
                 Learning Based Blind Speaker Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "457--468",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2881912",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic signal processing; array signal processing;
                 Array signal processing; beamforming; blind source
                 separation; blind speaker separation; chimera++
                 networks; complementary spectral features; deep
                 clustering; deep learning; direction estimation;
                 enhancement network; estimated direction; Geometry;
                 individual speakers; input feature level; learning
                 (artificial intelligence); Microphone arrays;
                 microphone geometry; microphones; multichannel speaker
                 separation; objective function level; permutation
                 invariant training; reverberant environments;
                 reverberant speaker mixtures; reverberant
                 talker-independent speaker separation; reverberation;
                 source separation; Spatial features; spatial features;
                 speaker recognition; specific spectral structures;
                 Speech processing; strong separation performance; T-F
                 unit level speaker dominance; trained models;
                 Training; two-channel chimera",
}

@Article{Anonymous:2019:ISPd,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "2",
  pages =        "C3--C3",
  month =        feb,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2893582",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
fjournal =       "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2019:TCd,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "C1--469",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2899785",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2019:ISPe,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "C2--C2",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2899787",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2019:TCf,
  author =       "Anonymous",
  title =        "Table of {Contents[Edics]}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "470--471",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2899789",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL
=                "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Jahromi:2019:ILH,
  author =       "M. Z. Jahromi and A. Zahedi and J. Jensen and J.
                 {\O}stergaard",
  title =        "Information Loss in the Human Auditory System",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "472--481",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2882913",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic stimuli; Acoustics; auditory cortex; Auditory
                 system; Brain modeling; closed-vocabulary
                 intelligibility test; decoding; Gaussian mixture
                 model; Gaussian processes; hearing; Human auditory
                 system; human listener; human word recognition rate;
                 information loss; information theoretic tools; machine
                 classifier; maximum likelihood classifier; mutual
                 information; Noise measurement; optimal classifiers;
                 Oral communication; pattern classification; Signal to
                 noise ratio; signal to noise ratio; SNR; speech
                 communication model; speech processing; Speech
                 recognition; speech recognition;
                 speech-in-stationary-noise setup; vocabulary",
}

@Article{Buchris:2019:ISS,
  author =       "Y. Buchris and A. Amar and J. Benesty and I.
Cohen",
  title =        "Incoherent Synthesis of Sparse Arrays for
                 Frequency-Invariant Beamforming",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "482--495",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2881536",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "array signal processing; Array signal processing;
                 audio acoustics; Bandwidth; beamformer coefficients;
                 Broadband communication; coherent sparse approach;
                 differential microphone arrays; dimensionality
                 clustering; dimensionality reduction; directivity
                 factor; frequency bin; Frequency-invariant beamformer;
                 frequency-invariant beamformers; frequency-invariant
                 beamforming; incoherent approach; incoherent sparse
                 design; incoherent synthesis; microphone arrays;
                 optimal sensors; Optimization; planar superdirective
                 array designs; Robustness; Sensor arrays; sensors
                 positions; signal waveform distortions; sparse array
                 layout; sparse arrays; sparse design; sparse designs;
                 sparse linear array designs; sparse set;
                 superdirective beamformers; underwater acoustics;
                 uniform array design; uniform arrays; white noise;
                 white noise gain",
}

@Article{Rahulamathavan:2019:PPI,
  author =       "Y. Rahulamathavan and K. R. Sutharsini and I. G. Ray
                 and R. Lu and M.
Rajarajan",
  title =        "Privacy-Preserving {$i$Vector}-Based Speaker
                 Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "496--506",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2882731",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "authentication; Bioinformatics; Cryptography; Data
                 privacy; data privacy; Feature extraction; iVector;
                 iVector-based voice verification technique; linear
                 discriminant analysis; linear discriminant analysis
                 techniques; Privacy; privacy-preserving iVector-based
                 speaker verification; privacy-preserving voice
                 verification; random domain; randomized domain;
                 security; Servers; speaker recognition; speech; voice
                 print",
}

@Article{Zhang:2019:ASR,
  author =       "J. Zhang and Y. Zhao and H. Li and C.
Zong",
  title =        "Attention With Sparsity Regularization for Neural
                 Machine Translation and Summarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "507--518",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2883740",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "abstractive summarization; attention mechanism;
                 attention weight distribution; de facto standard
                 component; Decoding; Entropy; entropy; final attention
                 distribution; input sentence; language translation;
                 Linear programming; machine translation; minimum
                 entropy regularization; neural machine translation;
                 neural nets; neural sequence; output sequence;
                 relevant input words; sequence tasks; Sequence to
                 sequence learning; sparse attention model; sparsity
                 regularization; sparsity regularization term; Speech
                 processing; Standards; summarization; Task analysis;
                 Training; visual perception",
}

@Article{Moore:2019:NCM,
  author =       "A. H. Moore and W. Xue and P. A. Naylor and M.
Brookes",
  title =        "Noise Covariance Matrix Estimation for Rotating
                 Microphone Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "519--530",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2882307",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Acoustic noise; adaptive estimation; array manifold;
                 array orientation; array rotation; array signal
                 processing; beamformers; covariance matrices;
                 Covariance matrices; Covariance matrix estimation;
                 desired source activity; estimated covariance matrix;
                 Estimation; estimation theory; ground truth noise
                 covariance matrix; Harmonic analysis; head-mounted
                 arrays; Indexes; microphone array; Microphone arrays;
                 microphone arrays; microphone signal covariance;
                 microphones; minimum variance distortionless response
                 beamformer; moving microphone array; noise covariance
                 matrix estimation; noise dereverberation; noise field;
                 noise figure 0.05 dB; noise figure 18.0 dB; noise
                 reduction performance; noise suppression; noise-only
                 segments; parametric model; spatial filtering; spatial
                 filters; spherical harmonic analysis; stored model
                 parameters",
}

@Article{Yang:2019:ESE,
  author =       "G. Yang and H. He and Q.
Chen",
  title =        "Emotion-Semantic-Enhanced Neural Network",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "531--543",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2885775",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Computational modeling; convolution neural network;
                 convolutional neural nets; deep learning; ECNN;
                 emoticons; emoticons projections; emotion recognition;
                 emotion-semantic-enhanced convolutional neural network
                 model; emotional signals; emotional space projection
                 operator; Feature extraction; feature representation
                 matrix; learning (artificial intelligence); matrix
                 algebra; microblog sentimental analysis; Natural
                 language processing; natural language processing
                 tasks; pattern classification; Semantics; Sentiment
                 analysis; sentiment analysis; social networking
                 (online); Task analysis",
}

@Article{Dietzen:2019:CAG,
  author =       "T. Dietzen and A. Spriet and W. Tirry and S. Doclo and
                 M. Moonen and T.
{van Waterschoot}",
  title =        "Comparative Analysis of Generalized Sidelobe
                 Cancellation and Multi-Channel Linear Prediction for
                 Speech Dereverberation and Noise Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "544--558",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2886743",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "array signal processing; Array signal processing;
                 blind speech dereverberation; comparative analysis;
                 data-dependent beamforming; deconvolution; Delays;
                 dereverberation; early reverberant-speech component;
                 Fourier transforms; generalized sidelobe canceler
                 framework; generalized sidelobe cancellation; GSC
                 blocking matrix; GSC framework; incoherent-noise
                 components; MCLP framework; microphones; Microphones;
                 Multi-channel linear prediction; multichannel linear
                 prediction framework; noise reduction; Noise
                 reduction; reverberation; speech enhancement; Speech
                 processing; time domain simulation results;
                 Time-domain analysis",
}

@Article{Gao:2019:MBC,
  author =       "J. Gao and J. Du and E.
Chen",
  title =        "Mixed-Bandwidth Cross-Channel Speech Recognition via
                 Joint Optimization of {DNN}-Based Bandwidth Expansion
                 and Acoustic Modeling",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "559--571",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2886739",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic features; acoustic modeling; Acoustics;
                 automatic speech recognition systems; average relative
                 word error rate reduction; bandwidth expansion;
                 bandwidth expansion networks; bandwidth-dependent
                 models; conventional multiple acoustic models; Data
                 models; Deep neural network; deep neural network-based
                 bandwidth expansion; different recording channels;
                 direct mapping DNN; diversified cross-channel speech
                 data; diversified speech data; diversified training
                 data; DNN-based acoustic models; DNN-based bandwidth
                 expansion; DNN-DM; feature extraction; general
                 framework; Hidden Markov models; highest sampling
                 rate; intermediate target layers; joint optimization;
                 joint training strategies; large-scale Mandarin speech
                 datasets; learning (artificial intelligence); low
                 sampling rates; mixed-bandwidth cross-channel speech
                 recognition; mixed-bandwidth speech recognition;
                 multiple bandwidths; multitask training; Narrowband;
                 neural nets; novel DNN architectures; progressive
                 mapping; progressive stacking network; scene related
                 speech data; specific sampling rate; Speech
                 recognition; speech recognition; transmission
                 channels; unified model; Wideband",
}

@Article{Deena:2019:RNN,
  author =       "S. Deena and M. Hasan and M. Doulaty and O. Saz and T.
Hain",
  title =        "Recurrent Neural Network Language Model Adaptation for
                 Multi-Genre Broadcast Speech Recognition and
                 Alignment",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "572--582",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2888814",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Adaptation models; automatic speech recognition;
                 Context modeling; Data models; feature-based
                 adaptation layer; feature-based RNNLMs; hybrid
                 adaptation techniques; language model adaptation;
                 linear hidden network adaptation layer; multi-domain
                 ASR; multigenre broadcast speech recognition; n-gram
                 language models; recurrent neural nets; recurrent
                 neural network language model adaptation; recurrent
                 neural network language models; RNNLM; RNNLM
                 adaptation techniques; Speech processing; Speech
                 recognition; speech recognition; Task analysis;
                 Training",
}

@Article{Gelderblom:2019:SEN,
  author =       "F. B. Gelderblom and T. V. Tronstad and E. M.
Viggen",
  title =        "Subjective Evaluation of a Noise-Reduced Training
                 Target for Deep Neural Network-Based Speech
                 Enhancement",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "583--594",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2882738",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "artificial neural networks; deep neural network;
                 Degradation; neural nets; Neural networks; Noise
                 measurement; noise-reduced training target; noisy
                 speech; POLQA; Signal to noise ratio; speech
                 distortion; Speech enhancement; speech enhancement;
                 speech enhancement systems; speech intelligibility;
                 speech processing; speech quality; speech recognition;
                 speech recognition test; subjective evaluation;
                 Training",
}

@Article{Valero:2019:LCM,
  author =       "M. Luis Valero and E. A. P.
Habets",
  title =        "Low-Complexity Multi-Microphone Acoustic Echo Control
                 in the Short-Time {Fourier} Transform Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "595--609",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2885786",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic coupling; acoustic signal processing;
                 Acoustics; array signal processing; background noise;
                 Convergence; desired near-end speech; echo
                 suppression; echo-to-noise ratio; Estimation; far-end
                 signal; Fourier transforms; high-quality end-to-end
                 communication; loudspeaker; loudspeakers;
                 low-complexity MM-AEC; low-complexity multimicrophone
                 echo controller; microphones; Microphones; modern
                 communication; Multi-microphone acoustic echo control;
                 multi-microphone noise reduction; multimicrophone
                 acoustic echo cancellation techniques; multimicrophone
                 acoustic echo control; multimicrophone speech;
                 near-end room; Noise measurement; relative transfer
                 function estimation; residual echo reduction;
                 short-time Fourier transform; smart devices; speech
                 enhancement; Speech processing; speech processing;
                 Steady-state",
}

@Article{Zhu:2019:RPA,
  author =       "Q. Zhu and P. Coleman and X. Qiu and M. Wu and J. Yang and I.
Burnett",
  title =        "Robust Personal Audio Geometry Optimization in the
                 {SVD}-Based Modal Domain",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "610--620",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2889927",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic contrast control; acoustic signal processing;
                 Acoustics; audio signal processing; broadband
                 equalization; equalisers; Geometry; geometry
                 optimization method; interference; listening zone;
                 Loudspeakers; loudspeakers; natural sound
                 reproduction; optimisation; Optimization; personal
                 audio geometry optimization; personalized listening
                 experiences; planarity control; pressure matching;
                 private listening experiences; quiet zone;
                 regularization; Robustness; robustness; shared space
                 sound zones; singular value decomposition; sound
                 reproduction; sound reproduction perturbations; sound
                 zones; Spatial audio; SVD-based modal domain; system
                 geometry; Transfer functions; Vibrations",
}

@Article{Yi:2019:LAT,
  author =       "J. Yi and J. Tao and Z. Wen and Y.
Bai",
  title =        "Language-Adversarial Transfer Learning for
                 Low-Resource Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "621--630",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2889606",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic model; Acoustics; Adaptation models;
                 adversarial learning; adversarial SHL-model;
                 Adversarial training; cross-lingual; Knowledge
                 transfer; language invariant features;
                 language-adversarial transfer learning; learning
                 (artificial intelligence); Learning systems; low
                 resource conditions; low-resource; Neural networks;
                 shared features; shared hidden layer model; speech
                 recognition; Speech recognition; target language;
                 target model; Training; transfer learning; unnecessary
                 language dependent information",
}

@Article{Zhang:2019:SSA,
  author =       "J. Zhang and Z. Ling and L. Liu and Y. Jiang and L.
Dai",
  title =        "Sequence-to-Sequence Acoustic Modeling for Voice
                 Conversion",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "631--644",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2892235",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic features; acoustic models; Acoustics;
                 appropriate duration conversion; attention; automatic
                 speech recognition model; Cloning; conversion stage;
                 Decoding; deep neural networks; Feature extraction;
                 feature extraction; feature sequences; Gaussian
                 mixture models; Gaussian processes; Linguistics;
                 Mel-scale spectrograms; Mel-spectrogram;
                 Mel-spectrograms; neural nets; SCENT model;
                 sequence-to-sequence; sequence-to-sequence acoustic
                 modeling; sequence-to-sequence ConvErsion NeTwork;
                 source speech; source utterances; Speech processing;
                 speech recognition; speech signals; target speakers;
                 training stage; unified acoustic model; vocal tract
                 descriptions; Vocoders; vocoders; Voice conversion;
                 Voice Conversion Challenge 2018",
}

@Article{Li:2019:MSS,
  author =       "X. Li and L. Girin and S. Gannot and R.
Horaud",
  title =        "Multichannel Speech Separation and Enhancement Using
                 the Convolutive Transfer Function",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "645--659",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2892412",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "1-norm minimization; 2-norm fitting cost;
                 approximation theory; array signal processing; Audio
                 source separation; basis pursuit method;
                 beamforming-like multichannel inverse filtering
                 method; computational cost; Convolution; convolutive
                 transfer function; convolutive transfer function
                 approximation; CTF domain; filter perturbations;
                 filtering theory; Fourier transforms; Lasso
                 optimization; microphone signals; microphones;
                 Microphones; minimisation; MINT; mixing filters;
                 mixing model; multichannel convolutive mixtures;
                 multichannel speech enhancement; multichannel speech
                 separation; multiple input-output inverse theorem;
                 noise power level; noisy mixtures; power minimization;
                 reverberation; short-time Fourier transform;
                 short-time Fourier transform domain; single-source
                 MINT; Source separation; source separation; spectral
                 sparsity; speech enhancement; Speech enhancement;
                 Time-domain analysis; time-domain filters; time-domain
                 inverse filters; time-domain Lasso; transfer
                 functions; Transfer functions",
}

@Article{Anonymous:2019:ISPf,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "3",
  pages =        "C3--C3",
  month =        mar,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2899791",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2019:TCg,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "C1--660",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2899859",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2019:ISPg,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "C2--C2",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2899863",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2019:TCh,
  author =       "Anonymous",
  title =        "Table of {Contents[Edics]}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "661--662",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2899861",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhao:2019:CNN,
  author =       "Z. Zhao and H. Liu and T. Fingscheidt",
  title =        "Convolutional Neural Networks to Enhance Coded
                 Speech",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "663--678",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2018.2887337",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "adaptive codes; adaptive multirate wideband codec;
                 category rating listening testing; cepstral analysis;
                 Cepstral analysis; cepstral domain feature approach;
                 CMOS integrated circuits; CMOS points; coded speech
                 enhancement; convolutional codes; convolutional neural
                 nets; convolutional neural networks; Convolutional
                 neural networks; far-end acoustic background noise;
                 G.711-coded speech; ITU-T-standardized postfilter;
                 narrowband speech codecs; Noise measurement;
                 postprocessing approaches; Quantization (signal);
                 quantization noise; Signal to noise ratio; speech
                 codecs; speech coding; Speech coding; Speech
                 enhancement; speech enhancement; speech quality
                 evaluation; statistical analysis; statistical
                 significance; time domain approaches; time-domain
                 analysis; time-domain approach; transmission errors;
                 uncoded speech; wideband speech codecs",
}

@Article{Schepker:2019:NSB,
  author =       "H. Schepker and S. E. Nordholm and L. T. T. Tran and S.
Doclo",
  title =        "Null-Steering Beamformer-Based Feedback Cancellation
                 for Multi-Microphone Hearing Aids With Incoming Signal
                 Preservation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "679--691",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2892234",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic feedback; Acoustic feedback cancellation;
                 acoustic feedback paths; acoustic signal processing;
                 Acoustics; adaptive filter; adaptive filters; array
                 signal processing; biased optimal solution;
                 closed-loop acoustical system; fixed beamformer;
                 hearing aid loudspeaker; Hearing aids; hearing aids;
                 incoming signal directions; incoming signal
                 preservation; least squares approximations;
                 least-squares optimization; least-squares optimization
                 procedure; Loudspeakers; loudspeakers; microphones;
                 Microphones; min-max optimization; min-max
                 optimization procedure; minimax techniques;
                 multimicrophone hearing aids; multiple integrated
                 microphones; null-steering; null-steering
                 beamformer-based feedback cancellation; Optimization;
                 perfect feedback cancellation; residual feedback
                 power; Speech processing; transfer functions; Transfer
                 functions",
}

@Article{Li:2019:LGO,
  author =       "Z. Li and Y. Song and L. Dai and I.
McLoughlin",
  title =        "Listening and Grouping: an Online Autoregressive
                 Approach for Monaural Speech Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "692--703",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2892241",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "autoregressive processes; causal temporal context;
                 closed-set evaluation; computational auditory scene
                 analysis; deep learning; Deep learning; deep learning
                 power; Extraterrestrial measurements; frame levels;
                 grouping architecture; grouping stage; Image analysis;
                 label permutation problem; learned listening; learning
                 (artificial intelligence); multispeaker monaural
                 speech separation; Neural networks; online
                 autoregressive approach; open-set evaluation; segment
                 levels; signal-to-distortion ratio; Speech processing;
                 speech quality scores; speech recognition; Speech
                 separation; Task analysis; Training; WSJ0-2mix
                 benchmark",
}

@Article{Deng:2019:SLC,
  author =       "D. Deng and L. Jing and J. Yu and S. Sun and M. K.
Ng",
  title =        "Sentiment Lexicon Construction With Hierarchical
                 Supervision Topic Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "704--718",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2892232",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "data mining; hierarchical supervision information;
                 hierarchical supervision topic model; Modeling; Motion
                 pictures; multinomial distribution; Neural networks;
                 opinion mining; pattern classification; Probabilistic
                 logic; probability; Sentiment analysis; sentiment
                 analysis; sentiment classification; sentiment lexicon
                 construction; Speech processing; Sun; text mining;
                 topic model; topic-adaptive sentiment lexicon",
}

@Article{Zhou:2019:SES,
  author =       "M. Zhou and M. Huang and X.
Zhu",
  title =        "Story Ending Selection by Finding Hints From Pairwise
                 Candidate Endings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "719--729",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2893499",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "commonsense reasoning; Computational modeling; Context
                 modeling; ending vector prediction; evidence bias
                 issue; four-sentence story context; humanities;
                 Machine reading comprehension; machine reading
                 comprehension; natural language processing; Natural
                 languages; neural nets; neural networks; pairwise
                 candidate endings; Predictive models; query
                 processing; Semantics; Speech processing; Story Cloze
                 Test; story comprehension; story ending selection;
                 Task analysis; vectors",
}

@Article{Richter:2019:ICS,
  author =       "J. Richter and J.
Fels",
  title =        "On the Influence of Continuous Subject Rotation During
                 High-Resolution Head-Related Transfer Function
                 Measurements",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "730--741",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2894329",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Acoustic measurements; acoustic signal processing;
                 artificial head; audible influence; audio signal
                 processing; continuous measurement rotation;
                 continuous rotation; continuous subject rotation; HRTF
                 measurement; individual head-related transfer
                 function; Interpolation; interpolation; loudspeaker
                 arrays; loudspeakers; Loudspeakers; measurement
                 signals; microphone arrays; objective comparison;
                 Position measurement; position measurement; Rotation
                 measurement; rotation measurement; rotation speed;
                 rotation speeds; Signal resolution; signal resolution;
                 sine sweep measurements; step-wise measurement
                 rotation; step-wise subject positioning; subjective
                 comparison; subjective listening experiment; Time
                 measurement; time measurement; transfer functions",
}

@Article{Yu:2019:ASI,
  author =       "J. Yu and K. Markov and T.
Matsui",
  title =        "Articulatory and Spectrum Information Fusion Based on
                 Deep Recurrent Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "742--752",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2894554",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic features; acoustic model DNN;
                 acoustic-to-articulatory inversion; Acoustics; AM DNN
                 training; articulatory features; articulatory
                 information; articulatory inversion DNN; Automatic
                 speech recognition; automatic speech recognition
                 systems; Computational modeling; Data models; deep
                 neural networks-hidden Markov model hybrid; deep
                 recurrent neural networks; distillation training; DNN
                 acoustic model; feature-based approach; feature-based
                 method; Hidden Markov models; hidden Markov models;
                 model-based approach; model-based method; phoneme
                 recognition system; recognition time; recurrent neural
                 nets; speech processing; Speech processing; Speech
                 recognition; speech recognition; Training; underlying
                 acoustic model",
}

@Article{Itturriet:2019:PRP,
  author =       "F. P. Itturriet and M. H.
Costa",
  title =        "Perceptually Relevant Preservation of Interaural Time
                 Differences in Binaural Hearing Aids",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "753--764",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2895973",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic noise; acoustic signal processing; aid
                 designers; binaural; binaural hearing aids; Cost
                 function; developed MWF-ITD technique; diffuse noise
                 fields; directional acoustic noise source; directional
                 noise source; Ear; Hearing aids; hearing aids;
                 Integrated circuits; interaural coherence concept;
                 interaural phase difference; interaural time
                 difference; ITD binaural cues; ITD subjective
                 perception; microphones; Microphones; multichannel
                 Wiener filter; MWF-IC technique; noise reduction;
                 noise reduction method; noise reduction technique;
                 original IC magnitude; processed noise; residual noise
                 spatial preservation; signal denoising; spatial
                 subjective sensation; speech processing; Wiener
                 filter; Wiener filters",
}

@Article{Abel:2019:SBL,
  author =       "J. Abel and T.
Fingscheidt",
  title =        "Sinusoidal-Based Lowband Synthesis for Artificial
                 Speech Bandwidth Extension",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "765--776",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2895969",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic bandwidth; artificial speech bandwidth
                 extension; Artificial speech bandwidth extension; CMOS
                 points; conventional narrowband telephony; Estimation;
                 Frequency estimation; Harmonic analysis; Hidden Markov
                 models; high-frequency components; instrumental
                 quality assessment; low-frequency band; lowband; NB
                 speech; sinusoidal; spectral analysis; spectrally
                 balanced speech signals; Speech coding; speech coding;
                 speech enhancement; Speech enhancement; speech
                 intelligibility; speech processing; speech quality;
                 speech synthesis",
}

@Article{Kong:2019:SED,
  author =       "Q. Kong and Y. Xu and I. Sobieraj and W. Wang and M. D.
Plumbley",
  title =        "Sound Event Detection and Time Frequency Segmentation
                 from Weakly Labelled Data",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "777--787",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2895254",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "acoustic signal detection; acoustic signal processing;
                 audio signal processing; classification mapping;
                 convolutional neural network; Convolutional neural
                 networks; DCASE 2018 Task 2 sound events data; Event
                 detection; feature extraction; learning (artificial
                 intelligence); neural nets; probability; segmentation
                 mapping; Sound event detection; sound event detection;
                 Spectrogram; speech recognition; supervised SED
                 algorithms; T-F segmentation masks; Tagging; Task
                 analysis; Time-frequency analysis; time-frequency
                 segmentation; Training; weakly labelled data",
}

@Article{Tuan:2019:ICS,
  author =       "Y. Tuan and H.
Lee",
  title =        "Improving Conditional Sequence Generative Adversarial
                 Networks by Stepwise Evaluation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "788--798",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2896437",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "chit-chat dialogue generation; computational costs;
                 conditional sequence generation tasks; conditional
                 sequence generative adversarial networks; Decoding;
                 Gallium nitride; Generative adversarial network;
                 Generative adversarial networks; Generators;
                 interactive systems; Maximum likelihood estimation;
                 MCTS; Monte Carlo methods; Monte Carlo tree search;
                 neural nets; REGS; SeqGAN; sequence generation;
                 StepGAN; stepwise evaluation; stepwise GAN; Task
                 analysis; Training; tree searching",
}

@Article{Dionelis:2019:MDK,
  author =       "N. Dionelis and M.
Brookes",
  title =        "Modulation-Domain {Kalman} Filtering for Monaural
                 Blind Speech Denoising and Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "799--814",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2894909",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "adaptive algorithm; adaptive filters; blind joint
                 denoising; dereverberation; direct-to-reverberant
                 energy ratio; DRR; interframe speech dynamics; Kalman
                 filter update step models; Kalman filtering; Kalman
                 filters; log-magnitude spectrum; minimum mean-square
                 error (MMSE) estimation; modulation; modulation-domain
                 Kalman filtering; monaural blind speech denoising;
                 monaural blind speech dereverberation; monaural speech
                 enhancement algorithm; Noise measurement; Noise
                 reduction; noisy reverberant speech; posterior
                 distribution estimation; reverberant speech to noise
                 ratios; reverberation; Reverberation; reverberation
                 time T60 parameters; signal denoising; Speech
                 enhancement; speech enhancement; speech
                 intelligibility; speech intelligibility quality;
                 speech log-magnitude spectrum estimation;
                 Time-frequency analysis; time-frequency log-magnitude
                 spectra",
}

@Article{Lotfian:2019:CLS,
  author =       "R. Lotfian and C.
Busso",
  title =        "Curriculum Learning for Speech Emotion Recognition
                 From Crowdsourced Labels",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "4",
  pages =        "815--826",
  month =        apr,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2898816",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "classification task; Computers; crowdsourced labels;
                 curriculum learning; Curriculum learning; deep neural
                 networks; DNNs; emotion perception; emotion
                 recognition; Emotion recognition; emotional content;
                 human judgments; inter-evaluator agreement; learning
                 (artificial intelligence); Machine learning; machine
                 learning problems; multiclass classification; neural
                 nets; pattern classification; regression analysis;
                 regression problems; speech emotion recognition;
                 Speech processing; Speech recognition; speech
                 recognition; speech samples; Task analysis; Training",
}

@Article{Lin:2019:RPE,
  author =       "S.
Lin", title = "Robust Pitch Estimation and Tracking For Speakers Based on Subband Encoding and The Generalized Labeled Multi-{Bernoulli} Filter", journal = j-IEEE-ACM-TASLP, volume = "27", number = "4", pages = "827--841", month = apr, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2898818", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "additive noise; auditory filterbank; autocorrelation; CASA; channel bank filters; computational auditory scene analysis approach; correlation methods; Estimation; estimation theory; frequency coverage; frequency coverage metric; Frequency estimation; generalized labeled multiBernoulli filter; GLMB tracking filter; Harmonic analysis; Hidden Markov models; measurement driven birth; measurement-driven birth model; normalized autocorrelation calculation; Ornstein Uhlenbeck process; Ornstein-Uhlenbeck process; pitch state transition model; Pitch tracking; robust pitch estimation methods; robust pitch tracker; sound signal decomposition; speaker estimation; speaker recognition; speaker tracking; speech coding; Speech processing; spurious error suppression; subband encoding; subband signals; Target tracking; temporal continuity constraint; time-frequency analysis; Time-frequency analysis; time-frequency sparsity", } @Article{Wang:2019:RHD, author = "X. Wang and I. Cohen and J. Chen and J. 
Benesty", title = "On Robust and High Directive Beamforming With Small-Spacing Microphone Arrays for Scattered Sources", journal = j-IEEE-ACM-TASLP, volume = "27", number = "4", pages = "842--852", month = apr, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2899517", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic radiators; acoustic wave scattering; Acoustics; Array signal processing; array signal processing; broadband acoustic source processing; diffuse noise gain; diffuse noise suppression; directional noise suppression; frequency-invariant beamformer; generalized MDNG beamformer; joint diagonalization technique; low white noise gain; maximum diffuse noise gain beamformer; maximum WNG beamformer; Microphone array; microphone arrays; Microphone arrays; MWNG beamformer; robust high directive beamforming; scattered acoustic source processing; scattered source; Sensor arrays; small-spacing microphone arrays; White noise; white noise; white noise gain", } @Article{Quan:2019:EFS, author = "Z. Quan and Z. Wang and Y. Le and B. Yao and K. Li and J. 
Yin", title = "An Efficient Framework for Sentence Similarity Modeling", journal = j-IEEE-ACM-TASLP, volume = "27", number = "4", pages = "853--865", month = apr, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2899494", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "attention constituency vector tree; attention weight; attention weight mechanisms; Kernel; Natural language processing; natural language processing; natural language processing applications; neural network methods; Neural networks; semantic information; semantic textual similarity datasets; Semantics; sentence embedding; Sentence similarity; sentence similarity measure; sentence similarity modeling; Speech processing; structured trees; syntactic information; syntactic structure; Syntactics; text analysis; tree kernel; trees (mathematics); Vegetation; word embedding; word embedding techniques", } @Article{Lubis:2019:PEE, author = "N. Lubis and S. Sakti and K. Yoshino and S. 
Nakamura", title = "Positive Emotion Elicitation in Chat-Based Dialogue Systems", journal = j-IEEE-ACM-TASLP, volume = "27", number = "4", pages = "866--877", month = apr, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2900910", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Affective computing; affective computing; affective dialogue systems; Appraisal; chat-based dialogue system; chat-based dialogue systems; Crowdsourcing; Databases; dialogue corpus; dialogue system interaction; elicit positive emotion; emotion appraisal; emotion elicitation; emotion recognition; Emotion recognition; emotion-rich corpora; emotion-sensitive neural chat-based dialogue system; emotional benefit; emotional support; human computer interaction; information retrieval; interactive systems; Natural language processing; natural language processing; neural nets; Neural networks; neural networks; positive emotion elicitation corpus; positive emotional response; positive emotional states; positive emotional valence; Speech processing", } @Article{Anonymous:2019:ISPh, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "4", pages = "C3--C3", month = apr, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2899865", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 27, number 5 (May 2019) starts with the entry below.

@Article{Anonymous:2019:TCi,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "C1--878",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2905796",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2019:ISPi,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "C2--C2",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2905798",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2019:TCj,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "879--880",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2905800",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ibarrola:2019:SDS,
  author =
"F. J. Ibarrola and R. D. Spies and L. E. {Di Persia}",
  title =        "Switching Divergences for Spectral Learning in Blind
                 Speech Dereverberation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "881--891",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2901643",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "artificial reverberation; Atomic measurements; audio
                 quality; audio signal processing; blind speech
                 dereverberation; Cost function; cost function
                 minimization; dereverberation; Dictionaries; dictionary
                 learning; enclosed room; fidelity term; Frequency
                 measurement; generalized $\beta$-divergence; human
                 computer interaction; human-machine interaction
                 technologies; learning (artificial intelligence);
                 nonnegative representation; observed spectrogram;
                 optimal fidelity parameter; penalization; real
                 recordings; reverberation; Reverberation; reverberation
                 model; Signal processing; signal representation; sound
                 signal; spectral learning; spectral structure;
                 Spectrogram; speech processing; Speech processing;
                 two-stage dereverberation approach",
  xxnote =       "Check: the imported metadata gave the third author as
                 ``L. E. D. Persia'' and one keyword as ``generalized
                 -divergence''. The surname is taken to be the compound
                 Di Persia (braced so that BibTeX does not split it) and
                 the lost symbol to be $\beta$ --- confirm both against
                 the article.",
}

@Article{Cohen:2019:DKP,
  author =       "I. Cohen and J. Benesty and J.
Chen", title = "Differential {Kronecker} Product Beamforming", journal = j-IEEE-ACM-TASLP, volume = "27", number = "5", pages = "892--902", month = may, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2895241", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustic arrays; Acoustics; array signal processing; Array signal processing; beampattern; Covariance matrices; Differential beamforming; differential Kronecker product beamformers; differential Kronecker product beamforming; directivity factor; front-to-back ratio; Kronecker product; Kronecker product decomposition; Kronecker product formulation; microphone array; microphone arrays; Microphone arrays; steering vector; superdirective beamforming; tradeoff control; vectors; virtual arrays; white noise; White noise; white noise gain", } @Article{Elisei-Iliescu:2019:RLS, author = "C. Elisei-Iliescu and C. Paleologu and J. Benesty and C. Stanciu and C. Anghel and S. 
Ciochin{\u{a}}", title = "Recursive Least-Squares Algorithms for the Identification of Low-Rank Systems", journal = j-IEEE-ACM-TASLP, volume = "27", number = "5", pages = "903--918", month = may, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2903276", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Adaptive filter; adaptive filters; Adaptive systems; Approximation algorithms; Complexity theory; computationally efficient versions; Convergence; convergence/tracking capabilities; DCD iterations; dichotomous coordinate descent iterations; echo cancellation; Echo cancellers; echo suppression; fast convergence rate; FIR filters; gradient methods; high-dimension system identification problem; impulse response decomposition; iterative methods; least mean squares methods; least squares approximations; long length adaptive filters; long length impulse responses; low-dimension problems; low-rank approximation; low-rank systems identification; Matrix decomposition; nearest Kronecker product; QR decomposition techniques; recursive least-squares (RLS) algorithm; recursive least-squares algorithms; regularization; RLS algorithm; Speech processing; system identification; system identification problems; Wiener filter; Wiener filters", } @Article{Kumar:2019:DLV, author = "A. Kumar and T. Guha and P. K. 
Ghosh",
  title =        "{Dirichlet} Latent Variable Model: a Dynamic Model
                 Based on {Dirichlet} Prior for Audio Processing",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "919--931",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2903288",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "audio processing applications; audio signal
                 processing; Data models; Dirichlet distribution;
                 Dirichlet latent variable model; dynamic Dirichlet;
                 dynamic latent variable model; dynamic parameters;
                 expectation-maximisation algorithm; exponential family
                 distributions; Hidden Markov models; Latent variable
                 model; learning (artificial intelligence); NMF; NMF
                 dynamic version; non negative; nonnegative matrix
                 factorization; probabilistic latent component analysis;
                 Probabilistic logic; Signal processing algorithms;
                 source separation; Source separation; speaker source
                 separation; Speech processing; time varying",
}

%%% NOTE(review): the surname of the first author of the following entry
%%% is assumed to carry a caron on each letter c; the accents were absent
%%% from the imported metadata, although the second author's umlauts were
%%% kept.  Confirm against the article.  The citation key is deliberately
%%% left in plain ASCII so that existing citations keep working.

@Article{Jancovic:2019:BSR,
  author =       "P. Jan{\v{c}}ovi{\v{c}} and M.
K{\"o}k{\"u}er", title = "Bird Species Recognition Using Unsupervised Modeling of Individual Vocalization Elements", journal = j-IEEE-ACM-TASLP, volume = "27", number = "5", pages = "932--947", month = may, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2904790", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic modeling; acoustic models; acoustic scene; acoustic signal detection; acoustic signal processing; Acoustics; audio field recordings; audio recording; audio signal processing; bioacoustics; biology computing; bird species identification; bird species recognition; Bird species recognition; bird vocalization elements; Birds; DNN-HMM; element models; Feature extraction; field recording; hidden Markov model; hidden Markov models; Hidden Markov models; hybrid deep neural network-hidden Markov model; iterative maximum likelihood label re-assignment procedure; maximum likelihood estimation; multiple bird species; neural nets; Noise measurement; nonbird sound recordings; normalized magnitude values; postrecognition stage; recognition accuracy; segmentation; signal classification; sinusoid; sound field recordings; Speech processing; Speech recognition; speech recognition; state duration modeling; unsupervised; unsupervised modeling; vocalisation element", } @Article{Koriyama:2019:SPS, author = "T. Koriyama and T. 
Kobayashi", title = "Statistical Parametric Speech Synthesis Using Deep {Gaussian} Processes", journal = j-IEEE-ACM-TASLP, volume = "27", number = "5", pages = "948--959", month = may, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2905167", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "approximation method; approximation theory; Bayes methods; Bayesian model; contextual features; conventional framework; deep architecture model; deep Gaussian processes; deep neural network-based speech synthesis; DGP framework; doubly stochastic variational inference; feedforward DNN-based method; Gaussian process; Gaussian processes; Global Positioning System; Hidden Markov models; Kernel; learning (artificial intelligence); model complexity; neural nets; Neural networks; regression analysis; speech parameters; Speech synthesis; speech synthesis; stacked Bayesian kernel regressions; Statistical parametric speech synthesis; statistical parametric speech synthesis framework; stochastic variational inference; Training data", } @Article{Shimada:2019:USE, author = "K. Shimada and Y. Bando and M. Mimura and K. Itoyama and K. Yoshii and T. 
Kawahara", title = "Unsupervised Speech Enhancement Based on Multichannel {NMF}-Informed Beamforming for Noise-Robust Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "27", number = "5", pages = "960--971", month = may, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2907015", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "array signal processing; Array signal processing; audio signal processing; beamforming; Covariance matrices; covariance matrices; Estimation; full-rank multichannel Wiener filters; minimum variance distortionless response beamforming; multichannel NMF-informed beamforming; multichannel nonnegative matrix factorization; multichannel speech enhancement; MVDR beamformers; neural nets; noise components; Noise measurement; noise-robust automatic speech recognition; noisy environments; Noisy speech recognition; observed noisy mixtures; rank-1 multichannel Wiener filters; separated speech; source separation; spatial information; Spectrogram; speech enhancement; Speech enhancement; speech recognition; time-frequency bin; unknown noisy environment; unsupervised approach; unsupervised speech enhancement; Wiener filters", } @Article{Widmark:2019:CMO, author = "S. 
Widmark", title = "Causal {MSE}-Optimal Filters for Personal Audio Subject to Constrained Contrast", journal = j-IEEE-ACM-TASLP, volume = "27", number = "5", pages = "972--987", month = may, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2904839", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic contrast; acoustic signal processing; Acoustics; audio signal processing; bright zone behavior; causal MSE-optimal filters; constrained contrast; Design methodology; direct method; filtering theory; filters; Frequency control; frequency-domain analysis; Frequency-domain analysis; frequency-domain optimal method; IIR filters; Mathematical model; novel design method; optimisation; Optimization; personal audio subject; pre-compensation filters; pre-existing noncausal methods; Signal processing; sound-system-room interactions; spectral bright zone behavior; Speech processing; unattainable contrasts", } @Article{Anonymous:2019:AAI, author = "Anonymous", title = "Article Awards for the {{\booktitle{IEEE\slash ACM Transactions on Audio, Speech, and Language Processing}}}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "5", pages = "988--988", month = may, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2908575", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = 
"Awards",
}

@Article{Anonymous:2019:ISPj,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "5",
  pages =        "C3--C3",
  month =        may,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2905802",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Volume 27, number 6 (June 2019) starts with the entry below.
%%% The two table-of-contents titles in this issue are capitalized as
%%% ``Table of Contents'', the spelling used by the other
%%% table-of-contents entries in this file.

@Article{Anonymous:2019:TCk,
  author =       "Anonymous",
  title =        "Table of Contents",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "C1--989",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2910095",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2019:ISPk,
  author =       "Anonymous",
  title =        "{IEEE Signal Processing Society}",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "C2--C2",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2910097",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2019:TCEb,
  author =       "Anonymous",
  title =        "Table of Contents
{(EDICS)}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "6", pages = "990--991", month = jun, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2910099", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mesaros:2019:SED, author = "A. Mesaros and A. Diment and B. Elizalde and T. Heittola and E. Vincent and B. Raj and T. Virtanen", title = "Sound Event Detection in the {DCASE 2017} Challenge", journal = j-IEEE-ACM-TASLP, volume = "27", number = "6", pages = "992--1006", month = jun, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2907016", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal detection; acoustic signal processing; Acoustics; confidence interval calculation; confidence intervals; DCASE 2017 challenge; deep neural networks; Detection and Classification of Acoustic Scenes and Events; detection requirements; Event detection; Glass; Hidden Markov models; jackknife estimates; jackknife resampling procedure; learning (artificial intelligence); maximization-minimization; mel frequency-based representations; neural nets; overlapping events; pattern recognition; ranking metric; signal classification; signal representation; Sound event detection; sound event detection; Speech processing; statistical analysis; target sound events; Task 
analysis; task-specific optimization; testing data; Training; training
                 data; weak labels; weakly labeled data",
}

%%% In the title of the following entry the math-mode letter is
%%% brace-protected, like the braced math in other titles of this file,
%%% so that a bibliography style which changes title case cannot alter it.

@Article{Chetupalli:2019:LRC,
  author =       "S. R. Chetupalli and T. V. Sreenivas",
  title =        "Late Reverberation Cancellation Using {Bayesian}
                 Estimation of Multi-Channel Linear Predictors and
                 {Student}'s {$t$}-Source Prior",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "27",
  number =       "6",
  pages =        "1007--1018",
  month =        jun,
  year =         "2019",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2906427",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Sat Aug 3 09:10:28 2019",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and
                 Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp;
                 http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
  keywords =     "Bayes methods; Bayesian estimation; Bayesian learning;
                 channel estimation; delayed linear predictor;
                 Dereverberation; early reflection component; enhanced
                 signals; Estimation; expectation-maximisation
                 algorithm; Fourier transforms; gamma distributed
                 precision; gamma distribution; Gaussian distribution;
                 Gaussian source model; hyper-parameter estimation;
                 inference estimation; late reverberation cancellation;
                 late reverberation suppression; linear prediction;
                 MCLP; microphone; Microphones; MIMO communication; MIMO
                 schemes; MISO communication; MISO scheme; multichannel
                 linear predictors; multichannel output schemes;
                 prediction residual; Predictive models; real room
                 impulse responses; residual signal estimation;
                 Reverberation; reverberation; short-time Fourier
                 transform; single channel output schemes; sparse
                 coefficient vector; spatial filtering; spatial filters;
                 stochastic models; student t-distribution model;
                 student t-source prior; time-dependent precision;
                 transient response; variational Bayes expectation
                 maximization algorithm; variational inference;
                 variational techniques; VBEM algorithm",
} @Article{Juvela:2019:GRW, author = "L. Juvela and B. Bollepalli and V. Tsiaras and P. Alku", title = "{GlotNet} --- a Raw Waveform Model for the Glottal Excitation in Statistical Parametric Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "27", number = "6", pages = "1019--1030", month = jun, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2906484", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic features; Acoustics; Computational modeling; direct speech waveform model; feedforward neural nets; generative neural network models; GlotNet; glottal excitation waveforms; glottal pulseforms; Glottal source model; glottal vocoders; Hidden Markov models; human voice production mechanism; model complexity; model size; Neural networks; raw audio; raw waveform glottal excitation model; raw waveform model; speech processing; speech synthesis; Speech synthesis; speech waveforms; statistical analysis; statistical parametric speech synthesis; statistical parametric TTS system; statistical vocoders; straightforward deep feedforward neural networks; synthesis quality; text-to-speech; text-to-speech synthesis; time-domain waveforms; vocoders; Vocoders; voice similarity; waveform generator architecture; WaveNet; WaveNet-like architecture", } @Article{Winter:2019:GMP, author = "F. Winter and F. Schultz and G. Firtha and S. 
Spors", title = "A Geometric Model for Prediction of Spatial Aliasing in {$ 2.5 $D} Sound Field Synthesis", journal = j-IEEE-ACM-TASLP, volume = "27", number = "6", pages = "1031--1046", month = jun, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2892895", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "2.5D sound field synthesis; acoustic signal processing; active prioritization; analytical sound field synthesis approaches; anti-aliasing criteria; approximation theory; arbitrary convex loudspeaker arrays; array signal processing; artefact-free synthesis; control region; conventional wave field synthesis; finite ensemble; Frequency synthesizers; fundamental sound fields; geometric model; geometrical framework; geometry; Geometry; local sound field synthesis approaches; local wave field synthesis; loudspeaker array arrangements; loudspeakers; Loudspeakers; Mathematical model; Numerical models; numerical simulation; plane waves; predicted spatial structure; Predictive models; ray-approximation; signal sampling; signal synthesis; Sound field synthesis; sound reproduction; spatial aliasing; spatial aliasing artefacts; spatial aliasing avoidance; spatial sampling process; spatial structure; Speech processing; spherical waves; synthesis problem; synthesised sound fields; time 2.5 d", } @Article{Liu:2019:AAV, author = "Y. Liu and T. Lee and T. Law and K. Y. 
Lee", title = "Acoustical Assessment of Voice Disorder With Continuous Speech Using {ASR} Posterior Features", journal = j-IEEE-ACM-TASLP, volume = "27", number = "6", pages = "1047--1059", month = jun, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2905778", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic features; acoustical assessment; ASR features; ASR posterior features; ASR-based voice features; automatic speech recognition system; automating voice assessment; continuous speech; continuous speech utterances; conventional features; conventional voice features; Databases; deep neural network; disordered voice; DNN based ASR system; Feature extraction; homogeneous speech samples; individual utterances; low-dimension ASR-based feature vector; Mel frequency cepstral coefficient; mild disorder; neural nets; normal voice; Pathology; phone posterior probabilities; posterior features; probability; Reliability; severe disorder; Speech processing; speech recognition; subject-level prediction accuracy; sustained vowels; Task analysis; utterance-level prediction accuracy; Voice assessment; voice disorder severity", } @Article{Porschmann:2019:DES, author = "C. P{\"o}rschmann and J. M. Arend and F. 
Brinkmann", title = "Directional Equalization of Sparse Head-Related Transfer Function Sets for Spatial Upsampling", journal = j-IEEE-ACM-TASLP, volume = "27", number = "6", pages = "1060--1071", month = jun, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2908057", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; directional equalization; directional rigid sphere transfer function; full-spherical sets; Harmonic analysis; head-related transfer functions; head-related transfer functions (HRTFs); interpolation; Interpolation; inverse SH transform; inverse transforms; order-limitation errors; set theory; SH interpolation; sparse datasets; sparse HRTF set; Spatial audio; spatial complexity; Spatial resolution; spatial upsampling; spectral components; Speech processing; spherical harmonics; temporal component; Time-domain analysis; Transfer functions; transfer functions; Transforms", } @Article{Payal:2019:ENP, author = "S. S. Payal and V. J. Mathews and D. J. Button and A. Iyer and R. H. Lambert and J. Hutchings and L. A. 
Azpicueta-Ruiz", title = "Equalization of Nonlinear Propagation Distortion in Cylindrical Waveguides", journal = j-IEEE-ACM-TASLP, volume = "27", number = "6", pages = "1072--1084", month = jun, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2908279", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustic distortion; acoustic waveforms; Acoustic waveguides; air-filled waveguide; Atmospheric modeling; Burgers propagation model; circular waveguides; equalisers; equalization; Equalizers; forward model; harmonic distortion; high sound pressure levels; intermodulation distortion; inverse problems; Mathematical model; model-based method; model-based pre-equalizer; Nonlinear acoustics; nonlinear distortion; Nonlinear distortion; nonlinear equalization; nonlinear propagation distortion; nonlinear systems; propagation-induced distortion; sign-inverted propagation model; total harmonic distortion; wave propagation", } @Article{Sisman:2019:GSR, author = "B. Sisman and M. Zhang and H. 
Li", title = "Group Sparse Representation With {WaveNet} Vocoder Adaptation for Spectrum and Prosody Conversion", journal = j-IEEE-ACM-TASLP, volume = "27", number = "6", pages = "1085--1097", month = jun, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2910637", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "activation matrix; Continuous wavelet transforms; conversion framework; Dictionaries; energy contour; feature conversion module; feature conversion studies; Gaussian processes; general speech corpus; general speech databases; group sparse representation; group sparsity mathematical formulation; matrix algebra; natural language processing; objective evaluations; phonetic dictionary; phonetic posteriorgrams; phonetic posteriorgrams (PPGs); phonetic sparse representation; Phonetics; PPG generator; prosody conversion; prosody conversion techniques; prosody features; signal representation; source-target training data; Sparse matrices; speaker characteristic transformation; speaker identity; spectral features; spectrum conversion; speech coding; statistical analysis; statistical approach; subjective evaluations; tandem feature; target speaker data; Training data; vocoders; Vocoders; vocoding quality; Voice conversion; voice conversion quality; wavenet vocoder; WaveNet vocoder adaptation", } @Article{Lee:2019:JLA, author = "J. Lee and H. 
Kang", title = "A Joint Learning Algorithm for Complex-Valued {T--F} Masks in Deep Learning-Based Single-Channel Speech Enhancement Systems", journal = j-IEEE-ACM-TASLP, volume = "27", number = "6", pages = "1098--1108", month = jun, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2910638", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "complex-valued T-F masks; complex-valued time-frequency mask; complex-valued time-frequency masks; Dynamic range; exact time-domain reconstruction; input noisy phase component; irregular spectrogram pattern; joint learning algorithm; large-scale deep learning network; learning (artificial intelligence); Learning systems; Linear programming; microphones; Noise measurement; phase spectra; single-channel microphone environment; Single-channel speech enhancement; single-channel speech enhancement systems; sound quality; spectrogram consistency; speech enhancement; Speech enhancement; speech enhancement algorithms; Time-domain analysis; time-frequency analysis", } @Article{Anonymous:2019:ISPl, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "6", pages = "C3--C3", month = jun, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2910101", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:TCl, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "27", number = "7", pages = "C1--1109", month = jul, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2915179", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:ISPm, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "7", pages = "C2--C2", month = jul, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2915181", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:TCm, author = "Anonymous", title = "Table of {Contents[Edics]}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "7", pages = "1110--1111", month = jul, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2915183", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
@Article{Flessner:2019:SOA, author = "J. Fle{\ss}ner and T. Biberger and S. D. Ewert", title = "Subjective and Objective Assessment of Monaural and Binaural Aspects of Audio Quality", journal = j-IEEE-ACM-TASLP, volume = "27", number = "7", pages = "1112--1125", month = jul, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2904850", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic noise; Audio quality; audio signal processing; auditory model; BAM-Q; binaural audio quality degradation prediction; binaural auditory-model-based quality prediction; binaural quality aspects; binaural signal distortions; combined monaural-binaural model; Databases; distortion; Distortion measurement; generalized power-spectrum model; generalized power-spectrum model for quality; GPSMq; joint overall audio predictions; monaural signal distortions; Nonlinear distortion; objective assessment; Predictive models; Psychoacoustic models; Psychoacoustics; spatial audio; subjective assessment", } @Article{Yusuf:2019:LRK, author = "B. Yusuf and B. Gundogdu and M. 
Saraclar", title = "Low Resource Keyword Search With Synthesized Crosslingual Exemplars", journal = j-IEEE-ACM-TASLP, volume = "27", number = "7", pages = "1126--1135", month = jul, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2911164", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic data; Acoustics; ASR-based baseline results; average term weighted value; bottleneck features; data scarcity; data-scarce settings; distance metric learning; dynamic time warping; EDML systems; exemplar matching; extended distance metric learner; Keyword search; keyword search performance; Lattices; low resource keyword search; multilingual acoustic model; multilingual features; multilingual network; natural language processing; Neural networks; out-of-vocabulary terms; query by example; query processing; query-by-example task; source languages; speech processing; speech recognition; Spoken term detection; synthesized crosslingual exemplars; synthetic phone exemplars; target language; Training; Training data; training data; transfer learning; Vocabulary", } @Article{Koutrouvelis:2019:RJE, author = "A. I. Koutrouvelis and R. C. Hendriks and R. Heusdens and J. 
Jensen", title = "Robust Joint Estimation of Multimicrophone Signal Model Parameters", journal = j-IEEE-ACM-TASLP, volume = "27", number = "7", pages = "1136--1150", month = jul, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2911167", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; array signal processing; Confirmatory factor analysis; dereverberation; early acoustic transfer functions; Estimation; joint diagonalization; Mathematical model; microphone arrays; microphone-self noise; Microphones; multimicrophone; multimicrophone signal model parameters; Noise measurement; parameter estimation; power spectral densities; reverberation; Reverberation; robust method; signal-model parameters; source separation; speech enhancement; Time-frequency analysis; transfer functions", } @Article{Cauchi:2019:NIS, author = "B. Cauchi and K. Siedenburg and J. F. Santos and T. H. Falk and S. Doclo and S. 
Goetze", title = "Non-Intrusive Speech Quality Prediction Using Modulation Energies and {LSTM}-Network", journal = j-IEEE-ACM-TASLP, volume = "27", number = "7", pages = "1151--1163", month = jul, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2912123", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic conditions; Acoustic measurements; Acoustics; benchmark intrusive measures; clean speech signal; intrusive measures; listening tests; long short-term memory cells; LSTM-network; Modulation; modulation; modulation energy; modulation energy features; non-intrusive prediction; nonintrusive measures; nonintrusive speech quality prediction; perceived speech quality; perceptual measures; perceptual speech quality; perceptually evaluated signals; Prediction algorithms; recurrent neural nets; recurrent neural network; reference signal; reverberation; signal processing algorithms; Signal processing algorithms; signal-based measures; speech enhancement; Speech enhancement; speech enhancement algorithm settings; speech enhancement algorithms; Speech quality", } @Article{Zhang:2019:TIN, author = "Y. Zhang and P. Zhang and Y. 
Yan", title = "Tailoring an Interpretable Neural Language Model", journal = j-IEEE-ACM-TASLP, volume = "27", number = "7", pages = "1164--1178", month = jul, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2913087", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "architectural structure; autoregressive moving average; autoregressive moving average processes; CNNs; component interpretability; convolutional neural nets; convolutional neural networks; Feature extraction; History; interpretability; interpretable neural language model; language modeling datasets; language modeling task; learning (artificial intelligence); learning method; Mathematical model; Neural language models; parameterized auto-regressive moving average model; Penn Treebank; prediction interpretability; Predictive models; recurrent neural nets; recurrent neural networks; Recurrent neural networks; RNNs; short-term memory LMs; speech recognition; switchboard speech recognition task; Task analysis; typical neural LMs; WikiText-2 datasets", } @Article{Pandey:2019:NFC, author = "A. Pandey and D. 
Wang", title = "A New Framework for {CNN}-Based Speech Enhancement in the Time Domain", journal = j-IEEE-ACM-TASLP, volume = "27", number = "7", pages = "1179--1188", month = jul, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2913512", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "CNN-based speech enhancement; Convolution; convolutional neural nets; convolutional neural network; Convolutional neural networks; deep learning; Fourier transforms; frequency domain loss; Frequency-domain analysis; fully convolutional neural network; learning (artificial intelligence); mean absolute error; mean absolute error loss; Noise measurement; noisy utterance; short-time Fourier transform magnitude; speech enhancement; Speech enhancement; Task analysis; time domain; time domain enhancement; Time-domain analysis; time-frequency masking", } @Article{Vikram:2019:DNV, author = "C. M. Vikram and N. Adiga and S. R. M. 
Prasanna", title = "Detection of Nasalized Voiced Stops in Cleft Palate Speech Using Epoch-Synchronous Features", journal = j-IEEE-ACM-TASLP, volume = "27", number = "7", pages = "1189--1200", month = jul, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2913089", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "cepstral analysis; Cleft palate; cleft palate speech; consonant-vowel transitions; CP speech; Databases; epoch synchronous features; epochs; feature extraction; Feature extraction; glottal activity; hidden Markov models; Mel-frequency cepstral coefficients; nasal consonants; nasalized voiced stops; Production; single pole filter; speech processing; Speech processing; speech recognition; support vector machines; Surgery; Time-frequency analysis; time-frequency representation; velopharyngeal dysfunction", } @Article{Luo:2019:IAT, author = "H. Luo and T. Li and B. Liu and B. Wang and H.
Unger", title = "Improving Aspect Term Extraction With Bidirectional Dependency Tree Representation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "7", pages = "1201--1212", month = jul, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2913094", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Aspect term extraction; aspect term extraction problem; aspect-based sentiment analysis; benchmark SemEval datasets; bidirectional dependency tree network; bidirectional dependency tree representation; BiLSTM plus CRF; bottom-up propagation; Browsers; Computer architecture; dependency structure feature extraction; dependency syntactic tree; dependency tree structure representation; directional propagation; embedded representations; end-to-end framework; Feature extraction; feature extraction; learning (artificial intelligence); Logic gates; natural language processing; recursive neural network; sentiment analysis; sequential features; Software; Syntactics; Task analysis; top-down propagation; tree data structures; tree-structured features", } @Article{Anonymous:2019:ISPn, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "7", pages = "C3--C3", month = jul, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2917346", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:TCn, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "C1--1213", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2917338", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:ISPo, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "C2--C2", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2917340", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2019:TCo, author = "Anonymous", title = "Table of Contents", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "1214--1215", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2917342", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2019:CLF, author = 
"T. Zhang and J. Wu", title = "Constrained Learned Feature Extraction for Acoustic Scene Classification", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "1216--1228", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2913091", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic scene classification; Acoustics; adaptive machine learning; Computational modeling; constrained learned feature extraction; convolutional neural network; Deep neural networks; deep neural networks; discrete Fourier transform; discrete Fourier transforms; Discrete Fourier transforms; feature extraction; Fourier transform; fully connected neural network; graphics processing unit; Graphics processing units; image classification; learning (artificial intelligence); neural nets; Neural networks; recurrent neural network; signal processing; signal processing procedure; simulated Fourier transform module; Task analysis; temporal transformer module", } @Article{Gabrielli:2019:MSA, author = "L. Gabrielli and S. Tomassetti and S. Squartini and C. Zinato and S. 
Guaiana", title = "A Multi-Stage Algorithm for Acoustic Physical Model Parameters Estimation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "1229--1240", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2914530", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic physical model parameter estimation; acoustic signal; acoustic signal processing; computational acoustics; Computational modeling; computational sound design; computational sound design approach; deep learning approach; iterative optimization; learning (artificial intelligence); Measurement; multistage algorithm; musical acoustics; musical instruments; Neural networks; neural networks; optimisation; Parameter estimation; parameter estimation; perceptually motivated objective cost functions; Physics-based acoustic modeling; pipe organ tones; sound design process time; stochastic optimization method; Stochastic processes; stochastic processes; Timbre; timbre matching; time to market", } @Article{Yang:2019:MSS, author = "B. Yang and H. Liu and C. Pang and X. 
Li", title = "Multiple Sound Source Counting and Localization Based on {TF}-Wise Spatial Spectrum Clustering", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "1241--1255", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2915785", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal detection; acoustic signal processing; adverse acoustic environments; correlation methods; enhanced TF-wise spatial spectra; Histograms; iterative methods; matrix algebra; microphone array recordings; Microphone arrays; microphone arrays; multiple sound source counting; multiple sound source localization; pattern clustering; received sensor signals; Reliability; remaining global spatial spectrum; Reverberation; signal denoising; signal subspace; Source counting; source detection; source presence possibility; spatial correlation matrix; spatial spectrum assignment; TF domain; TF-wise spatial spectrum; TF-wise spatial spectrum clustering; time-frequency analysis; Time-frequency analysis; time-frequency wise spatial spectrum clustering based method; unassigned spatial spectra", } @Article{Luo:2019:CTS, author = "Y. Luo and N. 
Mesgarani", title = "{Conv-TasNet}: Surpassing Ideal Time--Frequency Magnitude Masking for Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "1256--1266", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2915167", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Conv-TasNet system; Convolution; Decoding; Deep learning; deep learning; deep learning framework; end-to-end time-domain speech separation; fully convolutional time-domain audio separation network; ideal time-frequency magnitude masking; learning (artificial intelligence); linear codes; linear decoder; linear encoder; mixed signal; modified encoder representations; objective distortion measures; real-time; real-time speech separation applications; real-world speech processing technologies; signal representation; single-channel; single-channel speaker-independent speech separation methods; Source separation; source separation; speaker separation; Spectrogram; spectrograms; speech coding; Speech processing; speech separation systems; speech signal; speech waveform; speech waveform representation; stacked one-dimensional dilated convolutional blocks; subjective quality assessment; temporal convolutional network; three-speaker mixtures; time-domain; Time-domain analysis; time-frequency analysis; Time-frequency analysis; time-frequency representation; two-speaker speech separation; weighting functions", } @Article{Sarkar:2019:TCL, author = "A. K. Sarkar and Z. Tan and H. Tang and S. Shon and J.
Glass", title = "Time-Contrastive Learning Based Deep Bottleneck Features for Text-Dependent Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "1267--1279", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2915322", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "automatic speech recognition systems; BN feature extraction method; BN features; bottleneck feature; brain; brain signals; brain states; cepstral analysis; Clustering methods; deep bottleneck features; deep neural networks; DNNs; DNNs discriminating speakers; Feature extraction; feature extraction; fixed pass-phrases; Gaussian processes; GMM-UBM; image segmentation; learned features; learning (artificial intelligence); Mel frequency cepstral coefficient; multiframe segments; neural nets; nonstationarity property; pattern clustering; Phonetics; segment-based unsupervised clustering algorithm; short-time cepstral features; speaker recognition; speaker verification; speech data; speech frames; Speech recognition; speech signals; speech utterance; TCL BN feature; TCL-BN; TCL-DNNs; text-dependent speaker verification; time contrastive learning concept; time-contrastive features; time-contrastive learning; Training; training dataset", } @Article{Chua:2019:LLA, author = "J. Chua and W. B. 
Kleijn", title = "A Low Latency Approach for Blind Source Separation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "1280--1294", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2916360", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "blind source separation; Blind source separation; BSS algorithms; Delays; demixing parameter estimation; Estimation; long algorithmic delay; long analysis window; low latency; low latency approach; Matrix decomposition; microphones; Microphones; Microsoft Windows; parameter estimation; separation performance; subspace; time domain; Time-domain analysis; time-frequency analysis; Time-frequency analysis; time-frequency domain; traditional BSS approaches; window length", } @Article{Pan:2019:DTB, author = "C. Pan and J. Chen and J. Benesty and G. 
Shi", title = "On the Design of Target Beampatterns for Differential Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "1295--1307", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2918081", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic application; acoustic signal processing; Acoustics; ADMM algorithm; alternating-direction-method-of-multipliers algorithm; array signal processing; Array signal processing; audio application; classical target beampatterns; differential beamformer; differential beamforming; differential beamforming filter; differential microphone arrays; Differential microphone arrays; differential sound pressure field; effective beampattern; microphone arrays; Microphone arrays; optimisation; positive superposition theorem; Pressure measurement; resulting beampattern; Roads; speech application; Speech processing; target beampattern; target DMA; useful DMA target beampatterns", } @Article{Azmi:2019:RWE, author = "A. M. Azmi and M. N. Almutery and H. A. 
Aboalsamh", title = "Real-Word Errors in {Arabic} Texts: a Better Algorithm for Detection and Correction", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "1308--1320", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2918404", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib; https://www.math.utah.edu/pub/tex/bib/spell.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Arabic language; arabic OCR; Arabic text; computational linguistics; confusion sets-a simple approach; context-sensitive; context-sensitive errors; correction phase; correctly spelled word; corrects real-word errors; detection phase; Dictionaries; dyslexic text; learning (artificial intelligence); natural language processing; optical character recognition; Optical character recognition software; real-word error words; Real-word errors; semantic errors; Semantics; Speech processing; spelling error; statistical language model; stem n-gram; Syntactics; Testing; text analysis; Training; typical spell checker", } @Article{Korpusik:2019:DLD, author = "M. Korpusik and J. 
Glass", title = "Deep Learning for Database Mapping and Asking Clarification Questions in Dialogue Systems", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "1321--1334", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2918618", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "convolutional neural nets; convolutional neural network; convolutional neural network models; crowdsourcing; database mapping; Databases; deep reinforcement learning; deep RL; dialogue system; entropy; entropy-based methods; Games; hybrid RL model; interactive systems; learning (artificial intelligence); natural language interfaces; natural language processing; natural language representations; natural language user queries; Natural languages; nutrition domain; query languages; query processing; Reinforcement learning; RL agent; rule-based method; semantic embedding; Semantics; Speech processing; standard feature engineering; structured database entries; Task analysis; text analysis; text mismatch", } @Article{Pak:2019:SLB, author = "J. Pak and J. W. 
Shin", title = "Sound Localization Based on Phase Difference Enhancement Using Deep Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "1335--1345", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2919378", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic generators; acoustic radiators; background noise; classical sound source localization algorithms degrades; clean source signal estimation; deep neural networks; direction-of-arrival; Direction-of-arrival estimation; direction-of-arrival estimation; directional signals; DNN-based phase difference enhancement; DoA estimation; dry source signal estimation; end-fire directions; Estimation; estimation theory; input interchannel phase differences; interchannel phase difference; IPD enhancement; Microphones; neural nets; Noise measurement; reverberation; Reverberation; room impulse responses; Sound source localization; Speech enhancement", } @Article{Anonymous:2019:ISPp, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "8", pages = "C3--C3", month = aug, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2917344", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ali:2019:MEG, author = "R. 
Ali and G. Bernardi and T. {van Waterschoot} and M. Moonen", title = "Methods of Extending a Generalized Sidelobe Canceller With External Microphones", journal = j-IEEE-ACM-TASLP, volume = "27", number = "9", pages = "1349--1364", month = sep, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2918400", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "beamforming; blocking matrix; eigenvalues and eigenfunctions; External Microphone; GSC; GSC-LMA; LMA-based generalized sidelobe canceller; local microphone array; matrix algebra; Microphone arrays; microphone arrays; microphone spacings; Multi-Microphone Noise Reduction; Noise reduction; noise reduction; rank-1 generalized eigenvalue decomposition; relative transfer function; Speech Enhancement; speech enhancement; Speech enhancement; speech estimate; Wireless communication; Wireless sensor networks", } @Article{Li:2019:MOD, author = "X. Li and L. Girin and S. Gannot and R. 
Horaud", title = "Multichannel Online Dereverberation Based on Spectral Magnitude Inverse Filtering", journal = j-IEEE-ACM-TASLP, volume = "27", number = "9", pages = "1365--1377", month = sep, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2919183", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Adaptation models; channel identification; complex-valued CTF convolution model; Convolution; convolutive transfer function; cross-relation method; filtering theory; Fourier transforms; gradient descent criterion; gradient methods; Indexes; inverse filtering; inverse filters; least squares approximations; microphones; Microphones; multichannel CTF; multichannel equalization; multichannel online dereverberation; multiple-input/output inverse theorem; nonnegative convolution model; Online speech dereverberation; online STFT magnitude inverse filtering method; recursive least square criterion; Reverberation; reverberation; short-time Fourier transform domain; spectral magnitude inverse filtering; speech enhancement; Speech processing; speech recognition; STFT domain; time-domain analysis; Time-domain analysis; time-domain room impulse response", } @Article{Chen:2019:ATU, author = "L. Chen and Z. Chen and B. Tan and S. Long and M. Ga{\v{s}}i{\'c} and K. 
Yu", title = "{AgentGraph}: Toward Universal Dialogue Management With Structured Deep Reinforcement Learning", journal = j-IEEE-ACM-TASLP, volume = "27", number = "9", pages = "1378--1391", month = sep, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2919872", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "AgentGraph framework; AgentGraph models; Computational modeling; deep models; deep reinforcement learning; dialogue domain ontology; Dialogue policy; DRL-based algorithm; DRL-based policies; dual GNN-based dialogue policy; GNN based architecture; graph neural network based architecture; graph neural networks; graph theory; high-level global decision; interactive systems; learning (artificial intelligence); low-level local decision; multi-agent systems; multiagent reinforcement learning; neural nets; Neural networks; Ontologies; ontologies (artificial intelligence); Optimization; policy adaptation; policy optimization; policy transfer; PyDial benchmark; Reinforcement learning; structured deep reinforcement learning; Task analysis; task-oriented spoken dialogue systems; Training; transfer learning; universal dialogue management", } @Article{Li:2019:RCK, author = "L. Li and J. Wang and J. Li and Q. Ma and J. 
Wei", title = "Relation Classification via Keyword-Attentive Sentence Mechanism and Synthetic Stimulation Loss", journal = j-IEEE-ACM-TASLP, volume = "27", number = "9", pages = "1392--1404", month = sep, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2921726", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Adaptation models; attention mechanism; attention mechanisms; bidirectional gated recurrent unit; BiGRU; Feature extraction; imbalanced classification; imbalanced classification problem; Kernel; keyword-attentive sentence mechanism; learning (artificial intelligence); loss function; mutual learning; natural language processing; Neural networks; pattern classification; Relation classification; relation classification; Semantics; SemEval-2010 Task 8 data set; shortest dependency path; SSL-KAS-MuBiGRU; Syntactics; synthetic stimulation loss; TAC40 data set; Task analysis", } @Article{Moller:2019:ITF, author = "M. B. M{\o}ller and J. K. Nielsen and E. Fernandez-Grande and S. K. 
Olesen", title = "On the Influence of Transfer Function Noise on Sound Zone Control in a Room", journal = j-IEEE-ACM-TASLP, volume = "27", number = "9", pages = "1405--1418", month = sep, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2921151", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic field; acoustic leakage; Acoustic measurements; acoustic separation; acoustic signal processing; Acoustics; active eigenfunctions; audio signal processing; frequency 20.0 Hz to 300.0 Hz; headphones; high separation; in situ transfer function measurements; individual audio content; inherent noise; loudspeakers; Loudspeakers; measurement noise; microphones; Microphones; multiple loudspeakers; multiple people; Noise measurement; personal audio; rectangular room; Sensitivity; sound field control; sound reproduction; sound zone control; sound zone methods; Sound zones; target sound field; transfer function noise; Transfer functions; transfer functions", } @Article{Xu:2019:DWM, author = "Z. Xu and C. Sun and Y. Long and B. Liu and B. Wang and M. Wang and M. Zhang and X. 
Wang", title = "Dynamic Working Memory for Context-Aware Response Generation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "9", pages = "1419--1431", month = sep, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2915922", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Context modeling; context representation; context-aware response generation; contextual utterances; conversation context modeling; conversational agents; customer services; Decoding; deep learning; dialog context; dynamic working memory mechanism; encoder-decoder architecture; History; human evaluation; human-to-human conversations; interactive programming; interactive systems; Memory management; Memory modules; OpenSubtitles Corpus; Response generation; semantic interactions; Semantics; social networking (online); Speech processing; Twitter customer service corpus; ubiquitous computing", } @Article{Kameoka:2019:AVN, author = "H. Kameoka and T. Kaneko and K. Tanaka and N. 
Hojo", title = "{ACVAE-VC}: Non-Parallel Voice Conversion With Auxiliary Classifier Variational Autoencoder", journal = j-IEEE-ACM-TASLP, volume = "27", number = "9", pages = "1432--1443", month = sep, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2917232", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic feature sequences; Acoustics; ACVAE-VC; Artificial neural networks; attribute class label input; auxiliary classifier VAE; auxiliary classifier VAE (ACVAE); auxiliary classifier variational autoencoder; conditional variational autoencoder; convolutional architectures; decoder output networks; Decoding; decoding; fully convolutional network; Gallium nitride; Generators; information-theoretic regularization; learning (artificial intelligence); non-parallel VC; nonparallel VC systems; nonparallel voice conversion process; open-source parallel VC system; regular conditional VAE; speaker identity conversion task; speech coding; Speech recognition; trained encoder; Training; variational autoencoder (VAE); Voice conversion (VC)", } @Article{Chen:2019:EFW, author = "X. Chen and X. Liu and Y. Wang and A. Ragni and J. H. M. Wong and M. J. F. 
Gales", title = "Exploiting Future Word Contexts in Neural Network Language Models for Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "27", number = "9", pages = "1444--1454", month = sep, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2922048", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "bi-directional model; Computational modeling; Context modeling; feedforward; feedforward unit; History; keyword search; language model; language modeling; Lattices; natural language processing; neural network language model structure; probability; probability distributions; recurrent neural nets; Recurrent neural network; recurrent neural network LMs; Speech processing; speech recognition; Speech recognition; su-RNNLM; succeeding words; succeeding-word RNNLM; Training; word lattices", } @Article{Wang:2019:DBT, author = "R. Wang and Z. Chen and F. 
Yin", title = "{DOA}-Based Three-Dimensional Node Geometry Calibration in Acoustic Sensor Networks and Its {Cram{\'e}r--Rao} Bound and Sensitivity Analysis", journal = j-IEEE-ACM-TASLP, volume = "27", number = "9", pages = "1455--1468", month = sep, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2921892", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "3D rotation matrices; ABC algorithm; Acoustic sensor network; acoustic sensor networks; artificial bee colony algorithm; ASN geometry calibration; calibration; Calibration; concave programming; Cost function; Cram{\'e}r Rao bound; Cram{\'e}r-Rao bound; direction of arrival; Direction-of-arrival estimation; direction-of-arrival estimation; directional of arrival measurements; DOA-based node geometry calibration; DOA-based three-dimensional node geometry calibration; Estimation; geometric structure; geometry; Geometry; irregular geometric structures; matrix algebra; microphones; Microphones; minimisation; node geometry calibration; node geometry calibration method; node geometry calibration problem; node geometry positions; non-convex minimization; sensitivity analysis; sound source position error; theoretical DOAs; Three-dimensional displays; three-dimensional node geometry calibration approach; time-difference-of-arrival; tracking speakers; wireless sensor networks", } @Article{Lee:2019:MCS, author = "C. Lee and H. Lee and S. Wu and C. Liu and W. Fang and J. Hsu and B. 
Tseng", title = "Machine Comprehension of Spoken Content: {TOEFL} Listening Test and Spoken {SQuAD}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "9", pages = "1469--1480", month = sep, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2913499", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "academic English examination; attention model; Cognition; computer aided instruction; deep learning; English learners; Knowledge discovery; listening comprehension task; listening comprehension test; machine comprehension; native English speakers; natural language processing; neural nets; second listening comprehension task; Speech processing; Speech question answering; speech recognition; Speech recognition; spoken content; spoken SQuAD; SQuAD; Task analysis; text content; TOEFL; Videos; Visualization", } @Article{Chen:2019:AWS, author = "Y. Chen and S. Huang and H. Lee and Y. Wang and C. 
Shen", title = "Audio {Word2vec}: Sequence-to-Sequence Autoencoding for Unsupervised Learning of Audio Segmentation and Representation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "9", pages = "1481--1493", month = sep, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2922832", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustics; audio segmentation; audio signal processing; Audio word2Vec; Decoding; natural language processing; phonetic information; Phonetics; Recurrent neural networks; reinforcement learning; SA vector representations; segmental audio word2vec; sequence-to-sequence autoencoder; sequence-to-sequence autoencoding; signal representation; speaker information; speech processing; Speech recognition; Task analysis; Training; unannotated audio word2vec; unsupervised learning; unsupervised spoken word boundary segmentation; word level", } @Article{Li:2019:SAE, author = "P. Li and C. Chen and W. Zheng and Y. Deng and F. Ye and Z. 
Zheng", title = "{STD}: an Automatic Evaluation Metric for Machine Translation Based on Word Embeddings", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1497--1506", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2922845", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Earth; earth mover's distance; embedded n-grams; language translation; lexical-based metrics; Linguistics; machine translation; Machine translation evaluation; Measurement; metric; MT automatic evaluation; n-gram; natural language processing; NIST; semantic; semantic features; semantic relationships; semantic travel distance; Semantics; Speech processing; STD; Syntactics; word embeddings; word order", } @Article{Zhang:2019:RAT, author = "J. Zhang and R. Heusdens and R. C. 
Hendriks", title = "Relative Acoustic Transfer Function Estimation in Wireless Acoustic Sensor Networks", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1507--1519", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2923542", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic communication (telecommunication); audio recording; audio recordings; bit rate; convex optimization; convex programming; Correlation; correlation methods; covariance analysis; Covariance matrices; covariance subtraction; covariance subtraction method; covariance whitening; covariance whitening approach; CS-based methods; data records; eigenvalues and eigenfunctions; estimated RTF accuracy; Estimation; estimation performance; expected estimation error; generalized eigenvalue decomposition; greedy rate-distribution methods; matrix algebra; Matrix decomposition; Microphones; minimisation; model-based methods; model/data-driven rate distribution; Noise measurement; noisy correlation matrix; numerical analysis; numerical simulations; optimal rate distributions; power usage; power usage minimization; quantization; Quantization (signal); rate-distributed CW methods; relative acoustic transfer function estimation; relative transfer function; RTF estimation accuracy; Sensor networks; telecommunication power management; transfer functions; uniform rate allocation; WASN; wireless acoustic sensor networks; wireless sensor networks", } @Article{Park:2019:SSM, author = "J. Park and J. 
Chang", title = "State-Space Microphone Array Nonlinear Acoustic Echo Cancellation Using Multi-Microphone Near-End Speech Covariance", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1520--1534", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2923969", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustic arrays; acoustic signal processing; acoustic transfer function vector; approximation theory; array signal processing; ATF vector estimation; echo reduction; echo suppression; Eigenvalue decomposition; Kalman filter; Kalman filters; linear acoustic path; loudspeaker; loudspeakers; Low-rank approximation; low-rank approximation; microphone array NAEC algorithm; Microphone array nonlinear acoustic echo cancellation; Microphone arrays; microphone arrays; Multi-microphone near-end speech covariance; multimicrophone near-end speech covariance; multimicrophone Wiener filtering; near-end speech quality; Nonlinear acoustics; nonlinear acoustics; Parameterized multi-microphone Wiener filter; power series; recursive estimation; residual echo; reverberant condition; reverberation; SER; Signal processing algorithms; signal-to-echo ratio; single-microphone nonlinear AEC algorithm; single-microphone-based model; Speech processing; speech processing; state-space equation; state-space methods; state-space microphone array nonlinear acoustic echo cancellation; State-space modeling; transfer functions; Wiener filters", } @Article{Luo:2019:EVC, author = "Z. Luo and J. Chen and T. Takiguchi and Y. 
Ariki", title = "Emotional Voice Conversion Using Dual Supervised Adversarial Networks With Continuous Wavelet Transform {F0} Features", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1535--1548", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2923951", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic features; acoustic signal processing; adaptive scales continuous wavelet transform; ADS-CWT method; continuous wavelet transform F0 features; Continuous wavelet transforms; dual supervised adversarial networks; dual supervised learning; emotion recognition; emotional VC experiments; emotional VC task; Emotional voice conversion; emotional voice conversion tasks; emotional voice representation; feature extraction; generative adversarial networks; Hidden Markov models; labeled emotional voice; learning (artificial intelligence); low-level data space; neutral voice; over-smoothing problem; prosodic aspects; speech processing; Supervised learning; Task analysis; temporal levels; Training; training performance improvement; wavelet transform; wavelet transforms", } @Article{Asad:2019:RTL, author = "H. As'ad and M. Bouchard and H. 
Kamkar-Parsi", title = "A Robust Target Linearly Constrained Minimum Variance Beamformer With Spatial Cues Preservation for Binaural Hearing Aids", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1549--1563", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2924321", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; anechoic propagation; anechoic reverberant environments; array signal processing; Array signal processing; background noise; binaural beamforming algorithm; binaural cues preservations; binaural hearing aids; complex realistic acoustic scenarios; direction of arrival estimation; direction-of-arrival estimation; Direction-of-arrival estimation; directional interferers directions; Estimation; Hearing aids; hearing aids; higher order statistics; Microphones; mildly reverberant environments; noise reduction; Noise reduction; noise-only components; post-processor; propagation model mismatch; reverberation; Robust LCMV; robust target linearly constrained minimum variance beamformer; robust TLCMV; second-order statistics; simulated directional signals; spatial cues preservation; speech processing; steering vector mismatch; target distortion; target signal; target speaker direction", } @Article{Wang:2019:SSN, author = "Y. Wang and Y. Xia and L. Zhao and J. Bian and T. Qin and E. Chen and T. 
Liu", title = "Semi-Supervised Neural Machine Translation via Marginal Distribution Estimation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1564--1576", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2921423", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Computational modeling; Data models; Decoding; Mathematical model; natural language processing; Neural machine translation; Neural networks; semi-supervised learning; Task analysis; Training", } @Article{Jati:2019:NPC, author = "A. Jati and P. Georgiou", title = "Neural Predictive Coding Using Convolutional Neural Networks Toward Unsupervised Learning of Speaker Characteristics", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1577--1589", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2921890", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Convolutional Neural Networks (CNN); Neural networks; Predictive coding; siamese network; Speaker recognition; speaker recognition; Speaker-specific characteristics; Speech processing; Speech recognition; Task analysis; Training; unsupervised learning", } @Article{Fontana:2019:NRS, author = "F. Fontana and E. 
Bozzo", title = "{Newton--Raphson} Solution of Nonlinear Delay-Free Loop Filter Networks", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1590--1600", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2924842", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "basin of convergence; Computational modeling; Convergence; Digital delay-free loop; diode clipper; Integrated circuit modeling; Mathematical model; Modulation; Newton method; Newton-Raphson method; nonlinear filter network; ring modulator; Tools; virtual analogue", } @Article{Makishima:2019:IDL, author = "N. Makishima and S. Mogami and N. Takamune and D. Kitamura and H. Sumino and S. Takamichi and H. Saruwatari and N. 
Ono", title = "Independent Deeply Learned Matrix Analysis for Determined Audio Source Separation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1601--1615", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2925450", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Audio source separation; Covariance matrices; Data models; deep neural networks; Estimation; independent component analysis; Power capacitors; semi-supervised learning; Source separation; Spectrogram; Time-frequency analysis", } @Article{Prakash:2019:AIP, author = "J. J. Prakash and H. A. Murthy", title = "Analysis of Inter-Pausal Units in {Indian} Languages and Its Application to Text-to-Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1616--1628", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2924534", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Databases; Gamma distribution; gamma distribution; Hidden Markov models; Inter-pausal unit; IPU-based TTSes; Machine learning; number of syllables; phrasing; Speech processing; Syntactics; Training", } @Article{Lan:2019:KBQ, author = "Y. Lan and S. Wang and J. 
Jiang", title = "Knowledge Base Question Answering With a Matching-Aggregation Model and Question-Specific Contextual Relations", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1629--1638", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2926125", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Artificial intelligence; Context modeling; knowledge base question answering; Knowledge based systems; Knowledge discovery; natural language processing; Natural languages; Neural networks; Semantics; Task analysis", } @Article{Bai:2019:BAA, author = "X. Bai and H. Cao and K. Chen and T. Zhao", title = "A Bilingual Adversarial Autoencoder for Unsupervised Bilingual Lexicon Induction", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1639--1648", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2925973", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "bilingual lexicon induction; Computational modeling; Correlation; Decoding; Dictionaries; Speech processing; Training; Transforms; unsupervised word mapping; Word embeddings", } @Article{Zhao:2019:UPP, author = "G. Zhao and R. 
Gutierrez-Osuna", title = "Using Phonetic Posteriorgram Based Frame Pairing for Segmental Accent Conversion", journal = j-IEEE-ACM-TASLP, volume = "27", number = "10", pages = "1649--1660", month = oct, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2926754", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Accent conversion; acoustic model; Acoustics; Computational modeling; Phonetics; posteriorgram; Signal processing algorithms; Speech processing; Training; Trajectory; voice conversion", } @Article{Zhang:2019:ESS, author = "Z. Zhang and H. Zhao and K. Ling and J. Li and Z. Li and S. He and G. Fu", title = "Effective Subword Segmentation for Text Comprehension", journal = j-IEEE-ACM-TASLP, volume = "27", number = "11", pages = "1664--1674", month = nov, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2922537", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Linguistics; machine reading comprehension; Robot sensing systems; Semantics; Speech processing; Subword embedding; Task analysis; textual entailment; word segmentation", } @Article{Xie:2019:SEC, author = "Y. Xie and R. Liang and Z. Liang and C. Huang and C. Zou and B. 
Schuller", title = "Speech Emotion Classification Using Attention-Based {LSTM}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "11", pages = "1675--1685", month = nov, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2925934", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "attention mechanism; frame-level features; LSTM; Speech emotion", } @Article{Wang:2019:DNE, author = "S. Wang and Z. Huang and Y. Qian and K. Yu", title = "Discriminative Neural Embedding Learning for Short-Duration Text-Independent Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "27", number = "11", pages = "1686--1696", month = nov, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2928128", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Analytical models; angular softmax; center loss; Feature extraction; Linear discriminant analysis; Neural networks; Optimization; Short-duration text-independent speaker verification; speaker neural embedding; Speech processing; Training; triplet loss", } @Article{Lu:2019:AVD, author = "R. Lu and Z. Duan and C. 
Zhang", title = "Audio Visual Deep Clustering for Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "11", pages = "1697--1712", month = nov, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2928140", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 3 09:10:28 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "audio-visual fusion; deep clustering; Hidden Markov models; Lips; Robustness; Speaker-independent speech separation; Spectrogram; Speech processing; Training; Visualization", } @Article{Ueno:2019:TDS, author = "N. Ueno and S. Koyama and H. Saruwatari", title = "Three-Dimensional Sound Field Reproduction Based on Weighted Mode-Matching Method", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "1852--1867", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2934834", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic field; acoustic signal processing; array geometries; directivities; exterior sound field reproduction; Geometry; Harmonic analysis; interior reproduction; loudspeakers; Loudspeakers; Minimization; Mode-matching method; multizone reproduction; numerical analysis; optimal driving signals; optimal weight; reproduction accuracy; sound field reproduction; sound field reproduction method; sound field synthesis; sound reproduction; Speech processing; 
spherical wavefunction expansion; Three-dimensional displays; three-dimensional sound field reproduction; Two dimensional displays; weighted mode-matching method", } @Article{Wu:2019:BEP, author = "L. Wu and X. Tan and T. Qin and J. Lai and T. Liu", title = "Beyond Error Propagation: Language Branching Also Affects the Accuracy of Sequence Generation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "1868--1879", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2933727", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "abstractive summarization; accuracy drop; accuracy drop problem; autoregressive training; Decoding; error propagation; error propagation problem; language characteristic; language modeling; left-branching language; Linguistics; Maximum likelihood estimation; Measurement; natural language processing; neural machine translation; Sequence generation; sequence generation task; sequence generation tasks; Speech processing; Task analysis; text analysis; Training", } @Article{Das:2019:AAW, author = "A. Das and J. Li and G. Ye and R. Zhao and Y. 
Gong", title = "Advancing Acoustic-to-Word {CTC} Model With Attention and Mixed-Units", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "1880--1892", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2933325", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic-to-word; acoustic-to-word CTC model; Acoustics; attention; attention modeling; complex decoder; connectionist temporal classification criterion; Context modeling; context weighted inputs; CTC; CTC network; Data models; Decoding; E2E system; end-to-end system; frequent words; frequently occurring words; hard alignment issue; hybrid CTC; learning (artificial intelligence); letter CTC; Microsoft Cortana voice assistant task; mixed-unit CTC; multiletter units; OOV; OOV issue; OOV words; out-of-vocabulary issue; recurrent neural nets; Recurrent neural networks; self-attention CTC; shared hidden layers; speech coding; speech recognition; Training; Training data; vanilla word CTC; vocabulary; word error rate; word tagging; word-based CTC model", } @Article{Antonello:2019:JAL, author = "N. Antonello and E. {De Sena} and M. Moonen and P. A. Naylor and T. 
{van Waterschoot}", title = "Joint Acoustic Localization and Dereverberation Through Plane Wave Decomposition and Sparse Regularization", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "1893--1905", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2933047", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic model; acoustic signal processing; acoustic source localization; Acoustics; Approximation algorithms; dereverberated signals; Dereverberation; diffuse noise; direction of arrival; Direction-of-arrival estimation; direction-of-arrival estimation; DOA; Estimation; first order optimization algorithm; inverse problem; inverse problems; Inverse problems; joint acoustic localization and dereverberation; large-scale optimization problem; localized noise; microphone positions; microphones; Microphones; moving sound source; noise reduction; optimisation; Optimization; plane wave decomposition; reverberation; signal denoising; sound field; sound pressure; source localization; source separation; sparse regularization; sparse sensing; spatiospectral sparsity; spectral analysis; speech processing; weight signals; weighted overlap-add procedure", } @Article{Borra:2019:ULA, author = "F. Borra and A. Bernardini and F. Antonacci and A. 
Sarti", title = "Uniform Linear Arrays of First-Order Steerable Differential Microphones", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "1906--1918", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2934567", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "array signal processing; Array signal processing; audio signal processing; Beamforming; beamforming method; delay-and-sum beamformer; design methodologies; differential microphones; directivity factor; filtering layers; first-order steerable differential microphones; FOSDMs; Geometry; microphone arrays; Microphone arrays; Sensor arrays; single scalar parameter; spatial filtering method; spatial filters; traditional spatial filtering techniques; two-layer spatial filter; uniform linear arrays; White noise; white noise; white noise gain", } @Article{Chai:2019:UGG, author = "L. Chai and J. Du and Q. Liu and C. 
Lee", title = "Using Generalized {Gaussian} Distributions to Improve Regression Error Modeling for Deep Learning-Based Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "1919--1931", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2935803", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "assumed homoscedastic Gaussian error model; clean log-power spectral components; consistent improvements; conventional DNN framework; conventional minimum; conventional MMSE criterion; deep learning-based speech enhancement; deep neural network; DNN input vectors; DNN outputs; Gaussian distribution; Gaussian processes; generalized Gaussian distribution; generalized Gaussian distributions; GGD error model; heteroscedastic properties; improved generalization; learning (artificial intelligence); least mean squares methods; Linear programming; maximum likelihood estimation; maximum likelihood solution; mean square error methods; ML criterion; ML optimization objective; neural nets; noise; noisy LPS features; nonlinear regression deep neural network-based speech enhancement; prediction error modeling; prediction error vector; prediction errors; Predictive models; regression analysis; regression error modeling; robustness; speech enhancement; Speech enhancement; speech processing; squared error criterion; statistical analysis; statistical perspective; statistically independent random variables; super-Gaussian properties; Task analysis; Training", } @Article{Qi:2019:TDN, author = "J. Qi and J. Du and S. M. Siniscalchi and C. 
Lee", title = "A Theory on Deep Neural Network Based Vector-to-Vector Regression With an Illustration of Its Expressive Power in Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "1932--1943", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2935891", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "ANN structures; ANN-based regression function; artificial neural network; Biological neural networks; broader hidden layer; Computer architecture; deep neural network; Deep neural network; deeper architecture; expected clean speech; expressive power; function approximation; functional approximation; hidden layers; log power spectra; neural nets; Noise measurement; noisy expected clean speech; recently-emerged DNN based speech enhancement; regression analysis; regression performance; signal-to-noise-ratio levels; Speech enhancement; speech enhancement; Task analysis; top hidden layer; universal approximation; vector-to-vector regression; vector-to-vector regression functions; vectors", } @Article{Dang:2019:IMS, author = "X. Dang and Q. Cheng and H. 
Zhu", title = "Indoor Multiple Sound Source Localization via Multi-Dimensional Assignment Data Association", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "1944--1956", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2935837", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; Arrays; association costs; data association; direction of arrival; Direction-of-arrival estimation; direction-of-arrival estimation; Estimation; false alarm-originated subsets; false alarms; Feature extraction; indoor environments; indoor multiple sound source localization; microphone arrays; Microphone arrays; missed detections; multidimensional assignment data association; multidimensional assignment-based data association approach; multiple microphone arrays; Multiple sound source localization; multiple sound source localization problem; multisource scenarios; optimal associations; Position measurement; sensor fusion; source-originated DOA estimates; target tracking", } @Article{Schneider:2019:IDD, author = "M. Schneider and E. A. P. 
Habets", title = "Iterative {DFT}-Domain Inverse Filter Optimization Using a Weighted Least-Squares Criterion", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "1957--1969", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2936385", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "approximation algorithms; Digital filters; discrete Fourier transform domain; discrete Fourier transforms; Discrete Fourier transforms; effective regularization method; finite impulse response filters; Finite impulse response filters; FIR filters; frequency-domain analysis; Frequency-domain analysis; frequency-domain weight; iterative DFT-domain inverse filter optimization; iterative methods; jointly optimized filter coefficients; least squares approximation; least squares approximations; least-squares-optimal filter coefficients; Mathematical model; optimisation; Optimization; regularization parameters; sound-zones scenario; Speech processing; Time-domain analysis; time-domain analysis; time-domain filter coefficients; time-domain weights; weighted least-squares criterion", } @Article{Chen:2019:NMT, author = "K. Chen and R. Wang and M. Utiyama and E. Sumita and T. 
Zhao", title = "Neural Machine Translation With Sentence-Level Topic Context", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "1970--1984", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2937190", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Computer architecture; Context modeling; Convolution; convolution neural network; convolutional neural nets; Convolutional Neural Network; Decoding; English-to-German translation tasks; Feature extraction; language translation; Latent Topic Representation; latent topic representations; LDC Chinese-to-English translation tasks; natural language processing; Neural Machine Translation; neural machine translation methods; Sentence-level Context; sentence-level context; source sentence-level topic context information; Speech processing; statistical machine translation; target language translation; Task analysis; topic attention; transformer-based NMT; translation prediction; word-level context", } @Article{Gomez-Alanis:2019:GRC, author = "A. Gomez-Alanis and A. M. Peinado and J. A. Gonzalez and A. M. 
Gomez", title = "A Gated Recurrent Convolutional Neural Network for Robust Spoofing Detection", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "1985--1999", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2937413", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "anti-spoofing techniques; antispoofing system; ASV; automatic speaker verification systems; clean scenarios; Convolutional neural networks; deep feature extractor; deep features; deep learning; Feature extraction; feature extraction; gated recurrent convolutional neural networks; input spectral features; Logic gates; logical access attacks; logical scenarios; Noise measurement; noise robustness; noisy conditions; noisy environments; physical scenarios; recurrent neural nets; robust spoofing detection; Robustness; signal-to-noise masks; speaker recognition; speaker verification; Speech processing; speech signals; spoofing attacks; Spoofing detection; Training; utterance-level embeddings", } @Article{Feng:2019:ECL, author = "S. Feng and T. 
Lee", title = "Exploiting Cross-Lingual Speaker and Phonetic Diversity for Unsupervised Subword Modeling", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2000--2011", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2937953", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic modeling; Acoustics; across-speaker triphone minimal-pair; Adaptation models; automatic speech recognition systems; Clustering algorithms; cross-lingual speaker; deep neural networks; feature learning; frame clustering; frame-level labels; Hidden Markov models; high-quality frame labels; individual target languages; learning (artificial intelligence); low-resource languages; MTL-DNN; multi-task learning; multilingual bottleneck features; multitask learning; neural nets; out-of-domain ASR systems; out-of-domain languages; phonetic diversity; resource-rich; robust BNF representations; robust features; robust frame-level feature representations; speaker adaptation; Speech processing; speech recognition; subword-level speech units; supervised DNN training; target language; Task analysis; Training; training data; training speech; transcribed speech data; transcribed training data; unsupervised learning; unsupervised subword modeling; untranscribed training data; Zero resource", } @Article{Li:2019:IMD, author = "W. Li and N. F. Chen and S. M. Siniscalchi and C. 
Lee", title = "Improving Mispronunciation Detection of {Mandarin} Tones for Non-Native Learners With Soft-Target Tone Labels and {BLSTM}-Based Deep Tone Models", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2012--2024", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2936755", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustics; BLSTM-based verifiers; canonical tone categories; Computer-assisted language learning (CALL); computer-assisted pronunciation training (CAPT); Context modeling; Data mining; deep learning; Feature extraction; hard target labels; hard targets; Hidden Markov models; L2 learners; language learners whose first language; Mandarin lexical tones; mispronunciation detection; natural language processing; neural nets; non-native tone modeling and mispronunciation detection; nonnative learners; nonnative tone productions; pattern classification; Production; segmental tone features; sequential context information; short-term memory network; soft targets; soft-target tone labels; speech processing; Speech processing; speech recognition; tone posteriors; tone-level co-articulation; train binary classifiers; trained tone models", } @Article{Tu:2019:MOF, author = "Q. Tu and H. 
Chen", title = "On Mainlobe Orientation of the First- and Second-Order Differential Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2025--2040", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2937192", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; Acoustics; array signal processing; Differential microphone array; first order DMA; first-order differential microphone arrays; fixed endfire direction; Gain; lower-order differential microphone arrays; mainlobe orientation; Microphone arrays; microphone arrays; microphone mismatches; second-order differential microphone arrays; second-order DMA; Sensitivity; Speech processing; Tolerance analysis; tolerance analysis", } @Article{Chorowski:2019:USR, author = "J. Chorowski and R. J. Weiss and S. Bengio and A. 
{van den Oord}", title = "Unsupervised Speech Representation Learning Using {WaveNet} Autoencoders", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2041--2053", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2938863", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; acoustic unit discovery; Autoencoder; autoencoder models; autoencoding neural networks; Decoding; discrete vector quantized VAE; Feature extraction; Gaussian processes; Gaussian variational autoencoder; high capacity WaveNet decoder; high level semantic content; latent representation; latent representations; learning (artificial intelligence); low level details; neural nets; Neural networks; phoneme identities; phonetic content; Phonetics; pitch contour; Prototypes; simple dimensionality reduction bottleneck; speech processing; Speech processing; speech representation learning; speech waveforms; Task analysis; unsupervised extraction; unsupervised learning; unsupervised speech representation; vector quantisation; VQ-VAE; WaveNet autoencoders; ZeroSpeech 2017 unsupervised acoustic unit discovery task", } @Article{Varanasi:2019:NFA, author = "V. Varanasi and A. Agarwal and R. M. 
Hegde", title = "Near-Field Acoustic Source Localization Using Spherical Harmonic Features", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2054--2066", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2939782", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; Acoustics; Array signal processing; array signal processing; beamforming; convolutional neural nets; convolutional neural network; direction independent features; direction of arrival estimation; Direction-of-arrival estimation; direction-of-arrival estimation; Estimation; Feature extraction; Harmonic analysis; interpolation; learning (artificial intelligence); learning-based framework; Microphones; near-field acoustic source localization; Near-field beamforming; near-field DOA estimation; pressure distribution; range estimation; reverberant conditions; Root mean square error; signal invariant features; source signal strength; spatial pressure interpolation; spherical harmonic domain; spherical harmonic features; spherical microphone array; voice activity detection; voicing activity detection; Wigner-D functions", } @Article{Zheng:2019:FBD, author = "Y. Zheng and J. Tao and Z. Wen and J. 
Yi", title = "Forward Backward Decoding Sequence for Regularizing End-to-End {TTS}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2067--2079", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2935807", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustics; Decoding; decoding; directional models; divergence regularization terms; encoder-decoder with attention; end-to-end; English; Forward-backward; forward-backward decoding sequence; joint training method; joint-training; learning (artificial intelligence); Linguistics; Mandarin; model training; regularization; regularizing end-to-end TTS; regularizing neural end-to-end TTS; speech coding; Speech processing; Speech recognition; speech synthesis; Tacotron; target generation; Training; TTS", } @Article{Tu:2019:SEB, author = "Y. Tu and J. Du and C. 
Lee", title = "Speech Enhancement Based on Teacher Student Deep Learning Using Improved Speech Presence Probability for Noise-Robust Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2080--2091", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2940662", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Adaptation models; BGRU-equipped student model; bidirectional gated recurrent units; causal processing mode; CHiME-4 challenge task; complex noncausal teacher model; Computational modeling; deep learning based speech enhancement; deep neural network; error statistics; IMCRA; improved minima controlled recursive averaging; improved speech presence probability; IRM-based deep learning method; learning (artificial intelligence); neural nets; noise; Noise measurement; noise-robust speech recognition; nonlinear interactions; online noise tracking; ratio masks; regression-based enhancement model; relative WER reduction; speech enhancement; Speech enhancement; Speech recognition; speech recognition; teacher-student deep learning; Teacher-student learning; Training; word error rate", } @Article{Liu:2019:DCD, author = "Y. Liu and D. 
Wang", title = "Divide and Conquer: A Deep {CASA} Approach to Talker-Independent Monaural Speaker Separation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2092--2102", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2941148", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "acoustic signal processing; audio databases; computational auditory scene analysis; deep CASA; deep CASA approach; deep learning; Deep learning; divide and conquer; divide and conquer methods; frame-level separated spectra; frame-level separation; Image analysis; Indexes; learning (artificial intelligence); Monaural speech separation; multispeaker separation task; neural nets; Neural networks; Noise measurement; optimisation; pattern clustering; permutation-invariantly trained neural network; sequential grouping; simultaneous grouping; speaker recognition; speaker separation; speaker tracking; speech processing; Speech processing; talker-independent monaural speaker separation; Training; WSJ0-2mix database", } @Article{Liu:2019:LAB, author = "X. Liu and D. F. Wong and L. S. Chao and Y. 
Liu", title = "Latent Attribute Based Hierarchical Decoder for Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2103--2112", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2941587", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "attribute level; Computational modeling; Decoding; decoding; decoding process; decoding time; dynamic hierarchical decoder; English-German translation tasks; hierarchical decoder; language translation; Latent attribute; latent attribute vectors; learning (artificial intelligence); limited vocabulary; linguistic attributes; Linguistics; natural language processing; neural machine translation; neural machine translation (NMT); NMT baselines; Semantics; Speech processing; target word; Training; translation quality; Vocabulary; word vector", } @Article{Hu:2019:EFS, author = "J. Hu and N. 
Chen", title = "Enhanced Feature Summarizing for Effective Cover Song Identification", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2113--2126", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2942157", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustic measurements; audio signal processing; combined representative feature; cover song identification; Cover Song Identification (CSI); cross-similarity calculating stage; cross-similarity calculating strategies; Feature extraction; feature extraction; feature subsequence community; Feature Summarizing; feature summarizing stage; gene-function prediction accuracy; Hubness Reduction (HR); Hubness Reduction strategy; Hubness' phenomenon; identification accuracy; information retrieval; melody perception-based similarity; memory efficiency; music; Music; Network Enhancement (NE); Network Enhancement technique; Noise measurement; performance enhancement; retrieval effectiveness; self-similarity analysis-based feature; Self-Similarity Matrix (SSM); self-similarity network; Speech processing; statistical analysis; SuCo model; summarized representative feature subsequences; Thumb; unsummarized feature sequence", } @Article{Ma:2019:GLM, author = "Q. Ma and L. Yu and S. Tian and E. Chen and W. W. Y. 
Ng", title = "Global-Local Mutual Attention Model for Text Classification", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2127--2139", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2942160", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Computational modeling; Convolutional Neural Network (CNN); discriminative features; feature extraction; Feature extraction; global long-term dependencies; global-guided local-attention; global-local mutual attention model; informative features; key local semantic information; learning (artificial intelligence); local-guided global-attention; mutual attention mechanism; Mutual Attention Mechanism; mutual attention weights; mutual learning; natural language processing; Natural language processing; pattern classification; Recurrent Neural Network (RNN); Recurrent neural networks; relevant local semantic features; Semantics; Task analysis; text analysis; Text Classification; text classification problems; Visualization; Weighted-over-time Pooling; weighted-over-time pooling operation", } @Article{Vlimki:2019:NCG, author = "V. V{\"a}lim{\"a}ki and J. 
R{\"a}m{\"o}", title = "Neurally Controlled Graphic Equalizer", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2140--2149", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2935809", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Audio systems; Bandwidth; equalisers; Equalizers; equalizers; feedforward neural nets; feedforward neural network based method; feedforward neural networks; filter gain control; filtering theory; Gain; gain control; Graphics; IIR filters; learning (artificial intelligence); least-square design method; matrix inversion; music processing applications; neurally controlled graphic equalizer; neurocontrollers; noise figure 0.1 dB; Optimization; optimized band filter gain coefficients; Speech processing; supervised learning; telecommunication control; ten-octave graphic equalization design; time-varying equalization", } @Article{Wood:2019:BCB, author = "S. U. N. Wood and J. K. W. Stahl and P. 
Mowlaee", title = "Binaural Codebook-Based Speech Enhancement With Atomic Speech Presence Probability", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2150--2161", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2937174", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "ASPP estimators; ASPP-based speech enhancement algorithms; atomic speech presence probability; binaural codebook-based speech enhancement; binaural cue preservation; binaural cues; binaural mixtures; binaural noise reduction; Binaural speech enhancement; binaural speech enhancement benchmark methods; binaural STOI metrics; Estimation; given codebook atom; Indexes; interaural coherence magnitude; interaural phase; interaural transfer function; ITF-based ASPP approach; level difference; Noise measurement; Noise reduction; nonnegative matrix factorization; objective speech quality; PESQ metrics; probability; reverberant speech; reverberation; signal denoising; single codebook; speech coding; Speech coding; Speech enhancement; speech enhancement; speech intelligibility; transfer functions; universal codebook-based speech enhancement framework", } @Article{Pfeifenberger:2019:EBS, author = "L. Pfeifenberger and M. Z{\"o}hrer and F. 
Pernkopf", title = "Eigenvector-Based Speech Mask Estimation for Multi-Channel Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2162--2172", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2941592", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustics; Array signal processing; array signal processing; CHiME4 corpora; Direction-of-arrival estimation; eigennet architecture; eigenvalues and eigenfunctions; Eigenvector beamforming; eigenvector features; eigenvector-based speech mask estimation; estimation theory; filtering theory; generalized eigenvalue beamformers; GEV; Kaldi speech-to-text API; microphones; Microphones; minimum variance distortionless response; Multi-channel speech enhancement; multichannel microphone observations; multichannel speech enhancement; MVDR; Neural Networks; Noise measurement; PAN postfilter; phase aware normalization postfilter; Signal to noise ratio; SNR; Speech enhancement; speech enhancement; speech mask estimation; WER; word error rate; WSJ0 corpora", } @Article{Arnela:2019:MBV, author = "M. Arnela and S. Dabbaghchian and O. Guasch and O. 
Engwall", title = "{MRI}-Based Vocal Tract Representations for the Three-Dimensional Finite Element Synthesis of Diphthongs", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2173--2182", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2942439", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "3D dynamic vocal tract representations; acoustic wave propagation; acoustic waves; adaptive grid; adjacent cross-sections; Au; biomedical MRI; cross-section orientations; diphthongs; finite element analysis; Finite element analysis; Finite Element Method; Geometry; Interpolation; magnetic resonance imaging; Magnetic resonance imaging; mixed wave equation; MRI-based vocal tract geometries; MRI-based vocal tract representations; semi-polar grid; semi-polar grid strategy; Shape; Solid modeling; spatial resolution; speech; speech processing; speech synthesis; SPG dynamic vocal tract representation; static sounds; static vowel sounds; Three-dimensional displays; three-dimensional finite element synthesis; Vocal tract acoustics; vocal tract midline; wave equations", } @Article{Sekiguchi:2019:SSM, author = "K. Sekiguchi and Y. Bando and A. A. Nugraha and K. Yoshii and T. 
Kawahara", title = "Semi-Supervised Multichannel Speech Enhancement With a Deep Speech Prior", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2197--2212", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2944348", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Data models; deep learning; Maximum likelihood estimation; Multichannel speech enhancement; Noise measurement; nonnegative matrix factorization; Probabilistic logic; Speech enhancement; Time-frequency analysis; variational autoencoder", } @Article{Guo:2019:LRL, author = "Q. Guo and X. Qiu and X. Xue and Z. Zhang", title = "Low-Rank and Locality Constrained Self-Attention for Sequence Modeling", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2213--2222", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2944078", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Bit error rate; Data models; deep learning; Linguistics; Matrix decomposition; Natural language processing; self-attention; Sequence modeling; Sparse matrices; Task analysis; transformer", } @Article{Yu:2019:STP, author = "J. Yu and Q. Ling and C. Luo and C. W. 
Chen", title = "Synthesizing {$3$D} {Trump}: Predicting and Visualizing the Relationship Between Text, Speech, and Articulatory Movements", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2223--2233", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2935843", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustics; Animation; Feature extraction; Head; Linguistics; speech animation; Three-dimensional displays; Visual co-articulation; Visualization", } @Article{Sugiura:2019:SCD, author = "R. Sugiura and Y. Kamamoto and T. Moriya", title = "Shape Control of Discrete Generalized {Gaussian} Distributions for Frequency-Domain Audio Coding", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2234--2248", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2945843", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Audio compression; Computational modeling; entropy coding; generalized Gaussian distribution; Laplace equations; Psychoacoustic models; Shape; Speech coding; Speech processing", } @Article{Ben-Hur:2019:ERS, author = "Z. Ben-Hur and D. L. Alon and R. Mehra and B. 
Rafaely", title = "Efficient Representation and Sparse Sampling of Head-Related Transfer Functions Using Phase-Correction Based on Ear Alignment", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2249--2262", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2945479", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Ear; Finite wordlength effects; Frequency-domain analysis; head-related transfer functions (HRTFs); Interpolation; Spatial audio; Spatial resolution; Speech processing; spherical-harmonics; Transfer functions", } @Article{Remaggi:2019:MCF, author = "L. Remaggi and P. J. B. Jackson and W. Wang", title = "Modeling the Comb Filter Effect and Interaural Coherence for Binaural Source Separation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2263--2277", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2946043", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "binaural audio; Coherence; comb filter effect; ILD; Integrated circuit modeling; interaural coherence; IPD; multipath propagation; Reverberation; RIRs; Source separation; Speech processing", } @Article{Zhang:2019:FAK, author = "B. Zhang and D. Xiong and J. Su and J. 
Luo", title = "Future-Aware Knowledge Distillation for Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2278--2287", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2946480", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Computational modeling; Context modeling; Decoding; Future context; History; knowledge distillation; natural language processing; neural machine translation; Predictive models; Semantics; Training", } @Article{Ali:2019:IPE, author = "R. Ali and T. {Van Waterschoot} and M. Moonen", title = "Integration of a Priori and Estimated Constraints Into an {MVDR} Beamformer for Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2288--2300", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2946086", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Acoustic distortion; Acoustics; Beamforming; Correlation; Microphone arrays; Minimum Variance Distortionless Response (MVDR) Beamformer; Multi-Microphone Noise Reduction; Speech Enhancement; Speech enhancement; Tuning", } @Article{Tiwari:2019:SEU, author = "N. Tiwari and P. C. 
Pandey", title = "Speech Enhancement Using Noise Estimation With Dynamic Quantile Tracking", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2301--2312", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2945485", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Dynamic quantile tracking; Estimation; hearing aids; Indexes; Microsoft Windows; noise estimation; Noise measurement; Smoothing methods; speech communication devices; speech enhancement; Speech enhancement", } @Article{Duan:2019:TTD, author = "J. Duan and X. Ding and Y. Zhang and T. Liu", title = "{TEND}: A Target-Dependent Representation Learning Framework for News Document", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2313--2325", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2947364", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Document Representation; Internet; Logic gates; Neural networks; Speech processing; Stance Detection; Stock Market Prediction; Target-dependent Representation; Task analysis; Text mining; Twitter", } @Article{Zhao:2019:SLD, author = "L. Zhao and X. Qiu and Q. Zhang and X. 
Huang", title = "Sequence Labeling With Deep Gated Dual Path {CNN}", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2326--2335", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2944563", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Context modeling; convolutional neural networks; Hidden Markov models; Labeling; Logic gates; Natural language processing; recurrent neural networks; Recurrent neural networks; Sequence labeling; Task analysis", } @Article{Kato:2019:SRM, author = "A. Kato and T. H. Kinnunen", title = "Statistical Regression Models for Noise Robust {F0} Estimation Using Recurrent Deep Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2336--2349", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2945489", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Estimation; F0; Fundamental frequency; Hidden Markov models; Noise robustness; pitch; Recurrent neural networks; recurrent neural networks; regression model; Speech processing; Task analysis; waveform-to-sinusoid regression", } @Article{Liu:2019:BBF, author = "D. Liu and J. Fu and Q. Qu and J. 
Lv", title = "{BFGAN}: Backward and Forward Generative Adversarial Networks for Lexically Constrained Sentence Generation", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2350--2361", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2943018", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "Force; Gallium nitride; generative adversarial networks; Generators; Lexically constrained sentence generation; natural language generation; Natural languages; Search problems; Task analysis; Training", } @Article{Marafioti:2019:CEA, author = "A. Marafioti and N. Perraudin and N. Holighaus and P. Majdak", title = "A Context Encoder For Audio Inpainting", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2362--2372", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2947232", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "frequency-domain analysis; Image reconstruction; Instruments; machine learning; Music; Prediction algorithms; Psychoacoustic models; Reliability; signal processing algorithms; Time-domain analysis", } @Article{Yang:2019:EOS, author = "J. Yang and R. K. Das and N. 
Zhou", title = "Extraction of Octave Spectra Information for Spoofing Attack Detection", journal = j-IEEE-ACM-TASLP, volume = "27", number = "12", pages = "2373--2384", month = dec, year = "2019", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2946897", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Nov 29 16:54:01 2019", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", keywords = "constant-Q multi-level coefficients (CMC); Data mining; Discrete cosine transforms; Feature extraction; High frequency; Mel frequency cepstral coefficient; Multi-level transform (MLT); replay speech detection; synthetic speech detection", } @Article{Amini:2020:RCN, author = "Jamal Amini and Richard Christian Hendriks and Richard Heusdens and Meng Guo and Jesper Jensen", title = "Rate-Constrained Noise Reduction in Wireless Acoustic Sensor Networks", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "1--12", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2947777", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2947777", abstract = "Wireless acoustic sensor networks (WASNs) can be used for centralized multi-microphone noise reduction, where the processing is done in a fusion center (FC). To perform the noise reduction, the data needs to be transmitted to the FC. 
Considering the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gupta:2020:ALE, author = "Chitralekha Gupta and Haizhou Li and Ye Wang", title = "Automatic Leaderboard: Evaluation of Singing Quality Without a Standard Reference", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "13--26", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2947737", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2947737", abstract = "Automatic evaluation of singing quality can be done with the help of a reference singing or the digital sheet music of the song. However, such a standard reference is not always available. In this article, we propose a framework to rank a large pool of \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Eskimez:2020:NRT, author = "Sefik Emre Eskimez and Ross K. 
Maddox and Chenliang Xu and Zhiyao Duan", title = "Noise-Resilient Training Method for Face Landmark Generation From Speech", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "27--38", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2947741", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2947741", abstract = "Visual cues such as lip movements, when available, play an important role in speech communication. They are especially helpful for the hearing impaired population or in noisy environments. When not available, having a system to automatically generate \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2020:BGB, author = "Peidong Wang and Ke Tan and De Liang Wang", title = "Bridging the Gap Between Monaural Speech Enhancement and Recognition With Distortion-Independent Acoustic Modeling", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "39--48", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2946789", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2946789", abstract = "Monaural speech enhancement has made dramatic advances since the introduction of deep learning a few years ago. 
Although enhanced speech has been demonstrated to have better intelligibility and quality for human listeners, feeding it directly to automatic \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mitsufuji:2020:MNN, author = "Yuki Mitsufuji and Stefan Uhlich and Norihiro Takamune and Daichi Kitamura and Shoichi Koyama and Hiroshi Saruwatari", title = "Multichannel Non-Negative Matrix Factorization Using Banded Spatial Covariance Matrices in Wavenumber Domain", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "49--60", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2948770", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2948770", abstract = "Blind source separation exploiting multichannel information has long been a popular topic, and recently proposed methods based on the local Gaussian model have shown promising results despite its high computational cost for the case of many microphone \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Laufer:2020:SBM, author = "Yaron Laufer and Sharon Gannot", title = "Scoring-Based {ML} Estimation and {CRBs} for Reverberation, Speech, and Noise {PSDs} in a Spatially Homogeneous Noise Field", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "61--76", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2948794", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 
2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2948794", abstract = "Hands-free speech systems are subject to performance degradation due to reverberation and noise. Common methods for enhancing reverberant and noisy speech require the knowledge of the speech, reverberation and noise power spectral densities (PSDs). Most \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Desiraju:2020:OER, author = "Naveen Kumar Desiraju and Simon Doclo and Markus Buck and Tobias Wolff", title = "Online Estimation of Reverberation Parameters For Late Residual Echo Suppression", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "77--91", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2948765", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2948765", abstract = "In hands-free telephony and other distant-talk applications, often a short AEC filter is used to achieve fast convergence at low computational cost. 
As a result, a significant amount of late residual echo (LRE) may remain, especially in highly reverberant \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zohourian:2020:BDR, author = "Mehdi Zohourian and Rainer Martin", title = "Binaural Direct-to-Reverberant Energy Ratio and Speaker Distance Estimation", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "92--104", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2948730", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2948730", abstract = "This article addresses the problem of distance estimation using binaural hearing aid microphones in reverberant rooms. Among several distance indicators, the direct-to-reverberant energy ratio (DRR) has been shown to be more effective than other features. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shin:2020:LCU, author = "Youhyun Shin and Sang-goo Lee", title = "Learning Context Using Segment-Level {LSTM} for Neural Sequence Labeling", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "105--115", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2948773", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2948773", abstract = "This article introduces an approach that learns segment-level context for sequence labeling in natural language processing (NLP). Previous approaches limit their basic unit to a word for feature extraction because sequence labeling is a token-level task \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Huang:2020:DPD, author = "Gongping Huang and Jingdong Chen and Jacob Benesty", title = "Design of Planar Differential Microphone Arrays With Fractional Orders", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "116--130", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2949219", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2949219", abstract = "Differential microphone arrays (DMAs) often encounter white noise amplification, especially at low frequencies. 
If the array geometry and the number of microphones are fixed, one can improve the white noise amplification problem by reducing the DMA order. \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Su:2020:ABR, author = "Ming-Hsiang Su and Chung-Hsien Wu and Liang-Yu Chen", title = "Attention-Based Response Generation Using Parallel Double {Q}-Learning for Dialog Policy Decision in a Conversational System", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "131--143", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2949687", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2949687", abstract = "This article proposes an approach to response generation using a Parallel Double Q-learning algorithm for dialog policy decision in a conversational system. 
First, a new semantic representation of the user's input sentence is presented by using the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Emura:2020:WDR, author = "Satoru Emura", title = "Wave-Domain Residual Echo Reduction Using Subspace Tracking", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "144--156", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2949709", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2949709", abstract = "This article proposes a wave-domain residual echo reduction method for two-way immersive sound communication, which is based on wave field synthesis and uses uniform linear arrays of loudspeakers and microphones. 
This method is intended to improve the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2020:VQV, author = "Xin Wang and Shinji Takaki and Junichi Yamagishi and Simon King and Keiichi Tokuda", title = "A Vector Quantized Variational Autoencoder {(VQ-VAE)} Autoregressive Neural {$ F_0 $} Model for Statistical Parametric Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "157--170", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2950099", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2950099", abstract = "Recurrent neural networks (RNNs) can predict fundamental frequency (F0) for statistical parametric speech synthesis systems, given linguistic features as input. 
However, these models assume conditional independence between consecutive \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hoffmann:2020:DEP, author = "Falk-Martin Hoffmann and Philip Arthur Nelson and Filippo Maria Fazi", title = "{DOA} Estimation Performance With Circular Arrays in Sound Fields With Finite Rate of Innovation", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "171--184", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2950774", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2950774", abstract = "A novel Direction-of-Arrival (DOA) estimation method based on a plane wave sound field model was recently proposed for circular microphone arrays~[1]. 
This article presents a detailed theoretical analysis of \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Su:2020:CDD, author = "Rongfeng Su and Xunying Liu and Lan Wang and Jingzhou Yang", title = "Cross-Domain Deep Visual Feature Generation for {Mandarin} Audio--Visual Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "185--197", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2950602", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2950602", abstract = "There has been a long term interest in using visual information to improve automatic speech recognition (ASR) system performance. Both audio and visual information are required in conventional audio visual speech recognition (AVSR) systems. 
This limits \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Parcollet:2020:RHS, author = "Titouan Parcollet and Mohamed Morchid and Xavier Bost and Georges Linar{\`e}s and Renato {De Mori}", title = "Real to {H}-Space Autoencoders for Theme Identification in Telephone Conversations", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "198--210", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2950596", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2950596", abstract = "Machine learning (ML) and deep learning with deep neural networks (DNN), have drastically improved the performances of modern systems on numerous spoken language understanding (SLU) related tasks. 
Since most of current researches focus on new neural \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Canclini:2020:MRE, author = "Antonio Canclini and Fabio Antonacci and Stefano Tubaro and Augusto Sarti", title = "A Methodology for the Robust Estimation of the Radiation Pattern of Acoustic Sources", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "211--224", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2950767", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2950767", abstract = "We propose a novel methodology for estimating the radiation pattern of acoustic sources, which is general enough as to be suitable for a wide variety of sources without the need of anechoic conditions of operation. 
Multiple plenacoustic cameras (which can \ldots{}).", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yu:2020:EBN, author = "Yi Yu and Hongsen He and Badong Chen and Jianghui Li and Youwen Zhang and Lu Lu", title = "{$M$}-Estimate Based Normalized Subband Adaptive Filter Algorithm: Performance Analysis and Improvements", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "225--239", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2950597", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2950597", abstract = "This article studies the mean and mean-square behaviors of the M-estimate based normalized subband adaptive filter algorithm (M-NSAF) with robustness against impulsive noise. 
Based on the contaminated-Gaussian noise model, the stability condition, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wen:2020:PUA, author = "Hao-Xiang Wen and Sen-Quan Yang and Yuan-Quan Hong and Huan Luo", title = "A Partial Update Adaptive Algorithm for Sparse System Identification", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "240--255", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2949928", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2949928", abstract = "A sparse partial update (SPU) algorithm and its improved version improved SPU (ISPU) algorithm, are proposed in this paper for sparse system identification. The SPU first categorizes its filter coefficients into active and inactive coefficients. 
Then all \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Moller:2020:MHF, author = "Martin Bo M{\o}ller and Jan {\O}stergaard", title = "A Moving Horizon Framework for Sound Zones", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "256--265", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2951995", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2951995", abstract = "Sound zones are generated to provide independent audio reproduction to multiple people in the same room using loudspeakers. In this article, sound zones are formulated in terms of a moving horizon framework. This framework allows the reproduction scenario \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mimilakis:2020:EMF, author = "Stylianos Ioannis Mimilakis and Konstantinos Drossos and Estefan{\'\i}a Cano and Gerald Schuller", title = "Examining the Mapping Functions of Denoising Autoencoders in Singing Voice Separation", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "266--278", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2952013", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2952013", abstract = "The goal of this article is to investigate what singing voice separation approaches 
based on neural networks learn from the data. We examine the mapping functions of neural networks based on the denoising autoencoder (DAE) model that are conditioned on \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Birnie:2020:RAS, author = "Lachlan I. Birnie and Thushara D. Abhayapala and Prasanga N. Samarasinghe", title = "Reflection Assisted Sound Source Localization Through a Harmonic Domain {MUSIC} Framework", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "279--293", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2953000", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2953000", abstract = "This work presents a method that persuades acoustic reflections to be a favorable property for sound source localization. 
Whilst most real world spatial audio applications utilize prior knowledge of sound source position, estimating such positions in \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ding:2020:AMS, author = "Wenhao Ding and Liang He", title = "Adaptive Multi-Scale Detection of Acoustic Events", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "294--306", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2953350", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2953350", abstract = "The goal of acoustic (or sound) events detection (AED or SED) is to predict the temporal position of target events in given audio segments. This task plays a significant role in safety monitoring, acoustic early warning and other scenarios. 
However, the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2020:TSD, author = "Weijian Zhang and Peng Song", title = "Transfer Sparse Discriminant Subspace Learning for Cross-Corpus Speech Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "307--318", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2955252", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2955252", abstract = "Cross-corpus speech emotion recognition has attracted much attention due to the widespread existence of various emotional speech in life. It takes one corpus for training and another corpus for testing, and generally involves the following two basic \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sharma:2020:AES, author = "Bidisha Sharma and Ye Wang", title = "Automatic Evaluation of Song Intelligibility Using Singing Adapted {STOI} and Vocal-Specific Features", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "319--331", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2955253", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2955253", abstract = "An objective machine-driven measure of song intelligibility would be of great utility for various music 
information retrieval tasks. Song intelligibility mostly depends on two factors, the amount of interference caused by background accompaniment, and the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Morgenstern:2020:PTO, author = "Hai Morgenstern and Boaz Rafaely", title = "Perceptually-Transparent Online Estimation of Two-Channel Room Transfer Function for Sound Calibration", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "332--342", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2955286", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2955286", abstract = "Sound calibration is employed in many commercial audio systems for improving sound quality. This process includes the estimation of the room transfer function (RTF) between each loudspeaker and a microphone located at the listeners' position. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ding:2020:LSS, author = "Shaojin Ding and Guanlong Zhao and Christopher Liberatore and Ricardo Gutierrez-Osuna", title = "Learning Structured Sparse Representations for Voice Conversion", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "343--354", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2955289", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2955289", abstract = "Sparse-coding techniques for voice conversion assume that an utterance can be decomposed into a sparse code that only carries linguistic contents, and a dictionary of atoms that captures the speakers' characteristics. 
However, conventional \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Diez:2020:ASD, author = "Mireia Diez and Luk{\'a}{\v{s}} Burget and Federico Landini and Jan {\v{C}}ernock{\'y}", title = "Analysis of Speaker Diarization Based on {Bayesian} {HMM} With Eigenvoice Priors", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "355--368", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2955293", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2955293", abstract = "In our previous work, we introduced our Bayesian Hidden Markov Model with eigenvoice priors, which has been recently recognized as the state-of-the-art model for Speaker Diarization. 
In this article we present a more complete analysis of the Diarization \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gu:2020:UUI, author = "Jia-Chen Gu and Zhen-Hua Ling and Quan Liu", title = "Utterance-to-Utterance Interactive Matching Network for Multi-Turn Response Selection in Retrieval-Based Chatbots", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "369--379", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2955290", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2955290", abstract = "This article proposes an utterance-to-utterance interactive matching network (U2U-IMN) for multi-turn response selection in retrieval-based chatbots. 
Different from previous methods following context-to-response matching or utterance-to-response matching \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tan:2020:LCS, author = "Ke Tan and DeLiang Wang", title = "Learning Complex Spectral Mapping With Gated Convolutional Recurrent Networks for Monaural Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "380--390", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2955276", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Sat Aug 15 09:50:40 MDT 2020", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/abs/10.1109/TASLP.2019.2955276", abstract = "Phase is important for perceptual quality of speech. However, it seems intractable to directly estimate phase spectra through supervised learning due to their lack of spectrotemporal structure in it. 
Complex spectral mapping aims to estimate the real and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Duan:2020:CLT, author = "Richeng Duan and Tatsuya Kawahara and Masatake Dantsuji and Hiroaki Nanjo", title = "Cross-Lingual Transfer Learning of Non-Native Acoustic Modeling for Pronunciation Error Detection and Diagnosis", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "391--401", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2955858", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu May 27 17:56:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2019.2955858", abstract = "In computer-assisted pronunciation training (CAPT), the scarcity of large-scale non-native corpora and human expert annotations are two fundamental challenges to non-native acoustic modeling. 
Most existing approaches of acoustic modeling in CAPT are based \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2020:NSF, author = "Xin Wang and Shinji Takaki and Junichi Yamagishi", title = "Neural Source-Filter Waveform Models for Statistical Parametric Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "402--415", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2956145", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu May 27 17:56:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2019.2956145", abstract = "Neural waveform models have demonstrated better performance than conventional vocoders for statistical parametric speech synthesis. One of the best models, called WaveNet, uses an autoregressive (AR) approach to model the distribution of waveform sampling \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Parekh:2020:WSR, author = "Sanjeel Parekh and Slim Essid and Alexey Ozerov and Ngoc Q. K. 
Duong and Patrick P{\'e}rez and Ga{\"e}l Richard", title = "Weakly Supervised Representation Learning for Audio-Visual Scene Analysis", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "416--428", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2957889", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu May 27 17:56:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2019.2957889", abstract = "Audio-visual (AV) representation learning is an important task from the perspective of designing machines with the ability to understand complex events. To this end, we propose a novel multimodal framework that instantiates multiple instance learning. \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yu:2020:ESA, author = "Jianfei Yu and Jing Jiang and Rui Xia", title = "Entity-Sensitive Attention and Fusion Network for Entity-Level Multimodal Sentiment Classification", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "429--439", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2957872", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu May 27 17:56:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2019.2957872", abstract = "Entity-level (aka target-dependent) sentiment analysis of social media posts has recently attracted increasing attention, and its goal is to predict the sentiment orientations over individual target entities mentioned in users' posts. 
Most existing \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Beerends:2020:SOA, author = "John G. Beerends and Niels M. P. Neumann and Egon L. van den Broek and Anna Llagostera Casanovas and Jovana Torres Menendez and Christian Schmidmer and Jens Berger", title = "Subjective and Objective Assessment of Full Bandwidth Speech Quality", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "440--449", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2957871", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu May 27 17:56:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2019.2957871", abstract = "With the introduction of fullband speech coding the question arises what role frequency components above 14~kHz play in speech quality assessment. On the one hand, our results show that bandwidth limitation from 24~kHz down to 14~kHz \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mathad:2020:VOP, author = "Vikram C. Mathad and S. R. 
Mahadeva Prasanna", title = "Vowel Onset Point Based Screening of Misarticulated Stops in Cleft Lip and Palate Speech", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "450--460", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2957887", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu May 27 17:56:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2019.2957887", abstract = "The presence of velopharyngeal dysfunction, dental occlusion, and mislearned articulation in individuals with cleft lip and palate (CLP) results in the production of misarticulated stop consonants. The present work considers vowel onset points (VOPs) as \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nguyen:2020:HCE, author = "Minh Nguyen and Gia H. Ngo and Nancy F. Chen", title = "Hierarchical Character Embeddings: Learning Phonological and Semantic Representations in Languages of Logographic Origin Using Recursive Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "28", number = "??", pages = "461--473", month = jan, year = "2020", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2019.2955246", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu May 27 17:56:35 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2019.2955246", abstract = "Logographs (Chinese characters) have recursive structures (i.e. 
hierarchies of sub-units in logographs) that contain phonological and semantic information, as developmental psychology literature suggests that native speakers leverage on the structures to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Cherkassky:2020:SRT,
  author =       "Dani Cherkassky and Sharon Gannot",
  title =        "Successive Relative Transfer Function Identification Using Blind Oblique Projection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "474--486",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2957883",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2957883",
  abstract =     "Distortionless speech extraction in a reverberant environment can be achieved by applying a beamforming algorithm, provided that the relative transfer functions (RTFs) of the sources and the covariance matrix of the noise are known.
In this paper, the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Trowitzsch:2020:JSE,
  author =       "Ivo Trowitzsch and Christopher Schymura and Dorothea Kolossa and Klaus Obermayer",
  title =        "Joining Sound Event Detection and Localization Through Spatial Segregation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "487--502",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2958408",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2958408",
  abstract =     "Identification and localization of sounds are both integral parts of computational auditory scene analysis. Although each can be solved separately, the goal of forming coherent auditory objects and achieving a comprehensive spatial scene understanding \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Mogami:2020:ILR,
  author =       "Shinichi Mogami and Norihiro Takamune and Daichi Kitamura and Hiroshi Saruwatari and Yu Takahashi and Kazunobu Kondo and Nobutaka Ono",
  title =        "Independent Low-Rank Matrix Analysis Based on Time-Variant Sub-{Gaussian} Source Model for Determined Blind Source Separation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "503--518",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2959257",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2959257",
  abstract =     "Independent low-rank matrix analysis (ILRMA) is a fast and stable method of blind audio source separation. Conventional ILRMAs assume time-variant (super-)Gaussian source models, which can only represent signals that follow a super-Gaussian distribution. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ghasemzadeh:2020:TOQ,
  author =       "Hamzeh Ghasemzadeh and Meisam K. Arjmandi",
  title =        "Toward Optimum Quantification of Pathology-Induced Noises: an Investigation of Information Missed by Human Auditory System",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "519--528",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2959222",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2959222",
  abstract =     "Clinical diagnosis of voice disorder and evaluation of therapy outcome heavily rely on accurate quantification of voice quality, which is closely tied to the physiology and function of the laryngeal mechanism.
Considering the evaluation methodology of the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ma:2020:ACO,
  author =       "Fei Ma and Wen Zhang and Thushara Dheemantha Abhayapala",
  title =        "Active Control of Outgoing Broadband Noise Fields in Rooms",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "529--539",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2960716",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2960716",
  abstract =     "Active noise control system has been actively researched over the past half century, and implemented to reduce noises in ducts, headsets, and inside several automobile models.
However, active control of noise fields, and specifically broadband noise \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhang:2020:NPS,
  author =       "Jing-Xuan Zhang and Zhen-Hua Ling and Li-Rong Dai",
  title =        "Non-Parallel Sequence-to-Sequence Voice Conversion With Disentangled Linguistic and Speaker Representations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "540--552",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2960721",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2960721",
  abstract =     "This article presents a method of sequence-to-sequence (seq2seq) voice conversion using non-parallel training data. In this method, disentangled linguistic and speaker representations are extracted from acoustic features, and voice conversion is achieved \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Dai:2020:ASD,
  author =       "Tao Dai and Li Zhu and Yaxiong Wang and Kathleen M.
Carley",
  title =        "Attentive Stacked Denoising Autoencoder With {Bi-LSTM} for Personalized Context-Aware Citation Recommendation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "553--568",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2949925",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2949925",
  abstract =     "The rapid growth of scientific publications brings the problem of finding appropriate citations for authors. Context-aware citation recommendation is an essential technology to overcome this obstacle when given a fragment of manuscript. In this article, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Nishimura:2020:MSN,
  author =       "Yuta Nishimura and Katsuhito Sudoh and Graham Neubig and Satoshi Nakamura",
  title =        "Multi-Source Neural Machine Translation With Missing Data",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "569--580",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2959224",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2959224",
  abstract =     "Machine translation is rife with ambiguities in word ordering and word choice, and even with the advent of machine-learning methods that learn to resolve this ambiguity based on statistics from large corpora, mistakes are frequent.
Multi-source \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2020:TSR,
  author =       "Jin Wang and Liang-Chih Yu and K. Robert Lai and Xuejie Zhang",
  title =        "Tree-Structured Regional {CNN-LSTM} Model for Dimensional Sentiment Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "581--591",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2959251",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2959251",
  abstract =     "Dimensional sentiment analysis aims to recognize continuous numerical values in multiple dimensions such as the valence-arousal (VA) space. Compared to the categorical approach that focuses on sentiment classification such as binary classification (i.e., \ldots{})",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Azad:2020:RSF,
  author =       "Abul Azad and Lamine Mili",
  title =        "Robust Speech Filter and Voice Encoder Parameter Estimation Using the Phase--Phase Correlator",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "592--604",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2961556",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2961556",
  abstract =     "In recent years, linear prediction voice encoders have become very efficient in terms of computing
execution time and channel bandwidth usage while providing, in the absence of impulsive noise, natural sounding synthetic speech signals. This good \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Fahim:2020:MSD,
  author =       "Abdullah Fahim and Prasanga N. Samarasinghe and Thushara D. Abhayapala",
  title =        "Multi-Source {DOA} Estimation Through Pattern Recognition of the Modal Coherence of a Reverberant Soundfield",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "605--618",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2960734",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2960734",
  abstract =     "We propose a novel multi-source direction of arrival (DOA) estimation technique using a convolutional neural network algorithm which learns the modal coherence patterns of an incident soundfield through measured spherical harmonic coefficients.
We train \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Laufer:2020:MEC,
  author =       "Yaron Laufer and Bracha Laufer-Goldshtein and Sharon Gannot",
  title =        "{ML} Estimation and {CRBs} for Reverberation, Speech, and Noise {PSDs} in Rank-Deficient Noise Field",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "619--634",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2962689",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2962689",
  abstract =     "Speech communication systems are prone to performance degradation in reverberant and noisy acoustic environments. Dereverberation and noise reduction algorithms typically require several model parameters, e.g.~the speech, reverberation and noise \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2020:NSD,
  author =       "Zhongqing Wang and Qingying Sun and Shoushan Li and Qiaoming Zhu and Guodong Zhou",
  title =        "Neural Stance Detection With Hierarchical Linguistic Representations",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "635--645",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.2963954",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.2963954",
  abstract =     "Stance detection aims to assign a stance label (i.e.,
favor or against) to a post towards a specific target. Recently, there is a growing interest in adopting neural models to detect stance of a document. However, most of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Li:2020:MSE,
  author =       "Ruizhi Li and Xiaofei Wang and Sri Harish Mallidi and Shinji Watanabe and Takaaki Hori and Hynek Hermansky",
  title =        "Multi-Stream End-to-End Speech Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "646--655",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2959721",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2959721",
  abstract =     "Attention-based methods and Connectionist Temporal Classification (CTC) network have been promising research directions for end-to-end (E2E) Automatic Speech Recognition (ASR). The joint CTC/Attention model has achieved great success by utilizing both \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Maeno:2020:SHD,
  author =       "Yu Maeno and Yuki Mitsufuji and Prasanga N. Samarasinghe and Naoki Murata and Thushara D.
Abhayapala",
  title =        "Spherical-Harmonic-Domain Feedforward Active Noise Control Using Sparse Decomposition of Reference Signals from Distributed Sensor Arrays",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "656--670",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2019.2962684",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2019.2962684",
  abstract =     "Active acoustic noise attenuation over a sizable space is a challenging problem in signal processing. The noise attenuation performance of feedforward active noise control (ANC) relies on the preciseness of a reference signal of a primary noise field. To \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhou:2020:JSS,
  author =       "Qingyu Zhou and Nan Yang and Furu Wei and Shaohan Huang and Ming Zhou and Tiejun Zhao",
  title =        "A Joint Sentence Scoring and Selection Framework for Neural Extractive Document Summarization",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "671--681",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.2964427",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.2964427",
  abstract =     "Extractive document summarization methods aim to extract important sentences to form a summary.
Previous works perform this task by first scoring all sentences in the document then selecting most informative ones; while we propose to jointly learn the two \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Kukanov:2020:MFM,
  author =       "Ivan Kukanov and Trung Ngo Trong and Ville Hautam{\"a}ki and Sabato Marco Siniscalchi and Valerio Mario Salerno and Kong Aik Lee",
  title =        "Maximal Figure-of-Merit Framework to Detect Multi-Label Phonetic Features for Spoken Language Recognition",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "682--695",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.2964953",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.2964953",
  abstract =     "Bottleneck features (BNFs) generated with a deep neural network (DNN) have proven to boost spoken language recognition accuracy over basic spectral features significantly.
However, BNFs are commonly extracted using language-dependent tied-context phone \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Koyama:2020:OSS,
  author =       "Shoichi Koyama and Gilles Chardon and Laurent Daudet",
  title =        "Optimizing Source and Sensor Placement for Sound Field Control: an Overview",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "696--714",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.2964958",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.2964958",
  abstract =     "In order to control an acoustic field inside a target region, it is important to choose suitable positions of secondary sources (loudspeakers) and sensors (control points/microphones).
This article provides an overview of state-of-the-art source and \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ando:2020:CSE,
  author =       "Atsushi Ando and Ryo Masumura and Hosana Kamiyama and Satoshi Kobashikawa and Yushi Aono and Tomoki Toda",
  title =        "Customer Satisfaction Estimation in Contact Center Calls Based on a Hierarchical Multi-Task Model",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "715--728",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.2966857",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.2966857",
  abstract =     "This article presents a novel customer satisfaction~(CS) estimation method that outputs both turn-level and call-level estimations simultaneously.
Our key idea is to directly apply turn-level estimation results to call-level estimation and optimize \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Dietzen:2020:ISC,
  author =       "Thomas Dietzen and Simon Doclo and Marc Moonen and Toon van Waterschoot",
  title =        "Integrated Sidelobe Cancellation and Linear Prediction {Kalman} Filter for Joint Multi-Microphone Speech Dereverberation, Interfering Speech Cancellation, and Noise Reduction",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "740--754",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.2966869",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.2966869",
  abstract =     "In multi-microphone speech enhancement, reverberation as well as additive noise and/or interfering speech are commonly suppressed by deconvolution and spatial filtering, e.g., using multi-channel linear prediction (MCLP) on the one hand and beamforming, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Dietzen:2020:SRB,
  author =       "Thomas Dietzen and Simon Doclo and Marc Moonen and Toon van Waterschoot",
  title =        "Square Root-Based Multi-Source Early {PSD} Estimation and Recursive {RETF} Update in Reverberant Environments by Means of the Orthogonal {Procrustes} Problem",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "755--769",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.2966891",
  ISSN =         "2329-9290",
ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.2966891",
  abstract =     "Multi-channel short-time Fourier transform (STFT) domain-based processing of reverberant microphone signals commonly relies on power-spectral-density (PSD) estimates of early source images, where early refers to reflections contained within the same STFT \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhang:2020:PTP,
  author =       "Liwen Zhang and Ziqiang Shi and Jiqing Han",
  title =        "Pyramidal Temporal Pooling With Discriminative Mapping for Audio Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "770--784",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.2966868",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.2966868",
  abstract =     "Audio signals are temporally-structured data, and learning their discriminative representations containing temporal information is crucial for the audio classification.
In this article, we propose an audio representation learning method with a \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhang:2020:MIH,
  author =       "Mengfan Zhang and Zhongshu Ge and Tiejun Liu and Xihong Wu and Tianshu Qu",
  title =        "Modeling of Individual {HRTFs} Based on Spatial Principal Component Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "28",
  number =       "??",
  pages =        "785--797",
  month =        jan,
  year =         "2020",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.2967539",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:35 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.2967539",
  abstract =     "Head-related transfer function (HRTF) plays an important role in the construction of 3D auditory display. This article presents an individual HRTF modeling method using deep neural networks based on spatial principal component analysis.
The HRTFs are \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Jia:2021:HRI,
  author =       "Bijue Jia and Jiancheng Lv and Xi Peng and Yao Chen and Shenglan Yang",
  title =        "Hierarchical Regulated Iterative Network for Joint Task of Music Detection and Music Relative Loudness Estimation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "1--13",
  month =        jan,
  year =         "2021",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.3030484",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.3030484",
  abstract =     "One practical requirement of the music copyright management is the estimation of music relative loudness, which is mostly ignored in existing music detection works. To solve this problem, we study the joint task of music detection and music relative \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Dawalatabad:2021:NAU,
  author =       "Nauman Dawalatabad and Srikanth Madikeri and C. Chandra Sekhar and Hema A.
Murthy",
  title =        "Novel Architectures for Unsupervised Information Bottleneck Based Speaker Diarization of Meetings",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "14--27",
  month =        jan,
  year =         "2021",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.3036231",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.3036231",
  abstract =     "Speaker diarization is an important problem that is topical, and is especially useful as a preprocessor for conversational speech related applications. The objective of this article is two-fold: (i) segment initialization by uniformly distributing speaker \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Yousefi:2021:BBH,
  author =       "Midia Yousefi and John H. L. Hansen",
  title =        "Block-Based High Performance {CNN} Architectures for Frame-Level Overlapping Speech Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "28--40",
  month =        jan,
  year =         "2021",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.3036237",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.3036237",
  abstract =     "Speech technology systems such as Automatic Speech Recognition (ASR), speaker diarization, speaker recognition, and speech synthesis have advanced significantly by the emergence of deep learning techniques.
However, none of these voice-enabled systems \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Cheng:2021:DAN,
  author =       "Jiaming Cheng and Ruiyu Liang and Zhenlin Liang and Li Zhao and Chengwei Huang and Bj{\"o}rn Schuller",
  title =        "A Deep Adaptation Network for Speech Enhancement: Combining a Relativistic Discriminator With Multi-Kernel Maximum Mean Discrepancy",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "41--53",
  month =        jan,
  year =         "2021",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.3036611",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.3036611",
  abstract =     "In deep-learning-based speech enhancement (SE) systems, trained models are often used to handle unseen noise types and language environments in real-life scenarios.
However, since production environments differ from training conditions, mismatch problems \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anders:2021:CAN,
  author =       "Franz Anders and Mario Hlawitschka and Mirco Fuchs",
  title =        "Comparison of Artificial Neural Network Types for Infant Vocalization Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "54--67",
  month =        jan,
  year =         "2021",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.3037414",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.3037414",
  abstract =     "In this study we compared various neural network types for the task of automatic infant vocalization classification, i.e convolutional, recurrent and fully-connected networks as well as combinations of thereof.
The goal was to first determine the optimal \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Nakamura:2021:HTF,
  author =       "Tomohiko Nakamura and Hirokazu Kameoka",
  title =        "Harmonic-Temporal Factor Decomposition for Unsupervised Monaural Separation of Harmonic Sounds",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "68--82",
  month =        jan,
  year =         "2021",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.3037487",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.3037487",
  abstract =     "We address the problem of separating a monaural mixture of harmonic sounds into the audio signals of individual semitones in an unsupervised manner. Unsupervised monaural audio source separation has thus far been mainly addressed by two approaches: one \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ahrens:2021:CSH,
  author =       "Jens Ahrens and Stefan Bilbao",
  title =        "Computation of Spherical Harmonic Representations of Source Directivity Based on the Finite-Distance Signature",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "29",
  number =       "??",
  pages =        "83--92",
  month =        jan,
  year =         "2021",
  CODEN =        "????",
  DOI =          "https://doi.org/10.1109/TASLP.2020.3037471",
  ISSN =         "2329-9290",
  ISSN-L =       "2329-9290",
  bibdate =      "Thu May 27 17:56:39 MDT 2021",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2020.3037471",
  abstract =     "The measurement of directivity for sound sources that are not electroacoustic transducers is fundamentally limited because the source cannot be driven with arbitrary signals.
A consequence is that directivity can only be measured at a sparse set of \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chuang:2021:IAS, author = "Shun-Po Chuang and Alexander H. Liu and Tzu-Wei Sung and Hung-yi Lee", title = "Improving Automatic Speech Recognition and Speech Translation via Word Embedding Prediction", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "93--105", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3037543", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3037543", abstract = "In this article, we target speech translation (ST). We propose lightweight approaches that generally improve either ASR or end-to-end ST models. 
We leverage continuous representations of words, known as word embeddings, to improve ASR in cascaded systems \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chai:2021:CEG, author = "Li Chai and Jun Du and Qing-Feng Liu and Chin-Hui Lee", title = "A Cross-Entropy-Guided Measure {(CEGM)} for Assessing Speech Recognition Performance and Optimizing {DNN}-Based Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "106--117", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3036783", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3036783", abstract = "A new cross-entropy-guided measure (CEGM) is proposed to indirectly assess accuracies of automatic speech recognition (ASR) of degraded speech with a speech enhancement front-end and without directly performing ASR experiments. 
The proposed CEGM is \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hu:2021:PGC, author = "De Hu and Zhe Chen and Fuliang Yin", title = "Passive Geometry Calibration for Microphone Arrays Based on Distributed Damped {Newton} Optimization", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "118--131", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3037532", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3037532", abstract = "Geometry calibration is an inherent challenge in distributed acoustic sensor networks. To mitigate this problem, a passive geometry calibration approach based on distributed damped Newton optimization is proposed. Specifically, a geometric cost function \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sisman:2021:OVC, author = "Berrak Sisman and Junichi Yamagishi and Simon King and Haizhou Li", title = "An Overview of Voice Conversion and Its Challenges: From Statistical Modeling to Deep Learning", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "132--157", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3038524", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3038524", abstract = "Speaker identity is one of the important characteristics of human speech. 
In voice conversion, we change the speaker identity from one to another, while keeping the linguistic content unchanged. Voice conversion involves multiple speech processing \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jin:2021:SSL, author = "Jilu Jin and Gongping Huang and Xuehan Wang and Jingdong Chen and Jacob Benesty and Israel Cohen", title = "Steering Study of Linear Differential Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "158--170", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3038566", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3038566", abstract = "Differential microphone arrays (DMAs) can achieve high directivity and frequency-invariant spatial response with small apertures; they also have a great potential to be used in a wide spectrum of applications for high-fidelity sound acquisition. Although \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lee:2021:PAF, author = "Ching-Hua Lee and Bhaskar D. 
Rao and Harinath Garudadri", title = "Proportionate Adaptive Filtering Algorithms Derived Using an Iterative Reweighting Framework", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "171--186", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3038526", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3038526", abstract = "In this paper, based on sparsity-promoting regularization techniques from the sparse signal recovery (SSR) area, least mean square (LMS)-type sparse adaptive filtering algorithms are derived. The approach mimics the iterative reweighted \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ahmed:2021:NAI, author = "Shakeel Ahmed and Muhammad Tufail and Muhammad Rehan and Tanveer Abbas and Amna Majid", title = "A Novel Approach for Improved Noise Reduction Performance in Feed-Forward Active Noise Control Systems With (Loudspeaker) Saturation Non-Linearity in the Secondary Path", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "187--197", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3039607", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3039607", abstract = "In active noise control systems, the performance of the most celebrated filtered-x-least mean square (FxLMS) adaptive algorithm is degraded in the presence of non-linearity in the secondary path. 
In this article, we propose a novel approach to improve the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fan:2021:GRF, author = "Cunhang Fan and Jiangyan Yi and Jianhua Tao and Zhengkun Tian and Bin Liu and Zhengqi Wen", title = "Gated Recurrent Fusion With Joint Training Framework for Robust End-to-End Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "198--209", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3039600", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3039600", abstract = "The joint training framework for speech enhancement and recognition methods have obtained quite good performances for robust end-to-end automatic speech recognition (ASR). 
However, these methods only utilize the enhanced feature as the input of the speech \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Edraki:2021:SIP, author = "Amin Edraki and Wai-Yip Chan and Jesper Jensen and Daniel Fogerty", title = "Speech Intelligibility Prediction Using Spectro-Temporal Modulation Analysis", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "210--225", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3039929", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3039929", abstract = "Spectro-temporal modulations are believed to mediate the analysis of speech sounds in the human primary auditory cortex. Inspired by humans' robustness in comprehending speech in challenging acoustic environments, we propose an intrusive speech \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Son:2021:DSA, author = "Phan Le Son", title = "On the Design of Sparse Arrays With Frequency-Invariant Beam Pattern", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "226--238", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3040033", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3040033", abstract = "Beamformer performs spatial filtering to preserve the desired signal while suppressing interfering signals and noise arriving from directions other than the direction of interest.
However, the beam pattern of the conventional beamformer is dependent on \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Menzies:2021:RCM, author = "Dylan Menzies and Philip Coleman and Filippo Maria Fazi", title = "A Room Compensation Method by Modification of Reverberant Audio Objects", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "239--252", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3036781", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3036781", abstract = "Conventional channel-based room equalisation can reduce overall colouration caused by the room response, however it cannot separately correct the colouration caused by the late and early parts of the response, or consider the reverberance in the source \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hu:2021:MSD, author = "Yonggang Hu and Thushara D. Abhayapala and Prasanga N. 
Samarasinghe", title = "Multiple Source Direction of Arrival Estimations Using Relative Sound Pressure Based {MUSIC}", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "253--264", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3039569", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3039569", abstract = "Subspace approach of MUSIC (multiple signal classification) has become one of the most popular multi-source direction of arrival (DOA) estimations due to its easy implementation in practice. However, its localization accuracy is vulnerable to noise. This \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kan:2021:TLE, author = "Alan Kan and Qinglin Meng", title = "The Temporal Limits Encoder as a Sound Coding Strategy for Bilateral Cochlear Implants", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "265--273", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3039601", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3039601", abstract = "The difference in binaural benefit between bilateral cochlear implant (CI) users and normal hearing (NH) listeners has typically been attributed to CI sound coding strategies not encoding the acoustic fine structure (FS) interaural time differences (ITD). 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2021:EMP, author = "Rui Liu and Berrak Sisman and Feilong Bao and Jichen Yang and Guanglai Gao and Haizhou Li", title = "Exploiting Morphological and Phonological Features to Improve Prosodic Phrasing for {Mongolian} Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "274--285", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3040523", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3040523", abstract = "Prosodic phrasing is an important factor that affects naturalness and intelligibility in text-to-speech synthesis. Studies show that deep learning techniques improve prosodic phrasing when large text and speech corpus are available. However, for low- \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ma:2021:MCA, author = "Fei Ma and Thushara D. Abhayapala and Wen Zhang", title = "Multiple Circular Arrays of Vector Sensors for Real-Time Sound Field Analysis", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "286--299", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3040533", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3040533", abstract = "This article proposes multiple circular arrays of vector sensors for analyzing the three dimensional sound field.
By exploiting the fact that a finite number of spatial basis functions can represent the sound field within a region, the designed arrays \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Diaz-Guerra:2021:RSS, author = "David Diaz-Guerra and Antonio Miguel and Jose R. Beltran", title = "Robust Sound Source Tracking Using {SRP-PHAT} and {$3$D} Convolutional Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "300--311", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3040031", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3040031", abstract = "In this article, we present a new single sound source DOA estimation and tracking system based on the well-known SRP-PHAT algorithm and a three-dimensional Convolutional Neural Network. 
It uses SRP-PHAT power maps as input features of a fully \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Trinh:2021:DCL, author = "Viet Anh Trinh and Michael Mandel", title = "Directly Comparing the Listening Strategies of Humans and Machines", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "312--323", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3040545", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3040545", abstract = "Automatic speech recognition (ASR) has reached human performance on many clean speech corpora, but it remains worse than human listeners in noisy environments. This paper investigates whether this difference in performance might be due to a difference in \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sari:2021:ANJ, author = "Leda Sari and Mark Hasegawa-Johnson and Samuel Thomas", title = "Auxiliary Networks for Joint Speaker Adaptation and Speaker Change Detection", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "324--333", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3040626", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3040626", abstract = "Speaker adaptation and speaker change detection have both been studied extensively to improve automatic speech recognition (ASR). 
In many cases, these two problems are investigated separately: speaker change detection is implemented first to obtain single- \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2021:MAS, author = "Jielong Yang and Xionghu Zhong and Weiguang Chen and Wenwu Wang", title = "Multiple Acoustic Source Localization in Microphone Array Networks", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "334--347", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3039390", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3039390", abstract = "The problem of multiple acoustic source localization using observations from a microphone array network is investigated in this article.
Multiple source signals are assumed to be window-disjoint-orthogonal (WDO) on the time-frequency (TF) domain and time \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2021:TPB, author = "Bin Wu and Sakriani Sakti and Jinsong Zhang and Satoshi Nakamura", title = "Tackling Perception Bias in Unsupervised Phoneme Discovery Using {DPGMM-RNN} Hybrid Model and Functional Load", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "348--362", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3042016", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3042016", abstract = "The human perception of phonemes is biased against speech sounds. The lack of correspondence between perceptual phonemes and acoustic signals forms a big challenge in designing unsupervised algorithms to distinguish phonemes from sound. 
We propose the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lee:2021:FGS, author = "Taewoong Lee and Liming Shi and Jesper Kj{\ae}r Nielsen and Mads Gr{\ae}sb{\o}ll Christensen", title = "Fast Generation of Sound Zones Using Variable Span Trade-Off Filters in the {DFT}-Domain", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "363--378", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3042701", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3042701", abstract = "The creation of sound zones with frequency-domain variable span trade-off filters (VAST) is investigated herein. Both narrowband and broadband discrete Fourier transform (DFT)-domain VAST approaches are proposed, and we discuss their relationship to the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jia:2021:MSD, author = "Maoshen Jia and Yuxuan Wu and Changchun Bao and Christian Ritz", title = "Multi-Source {DOA} Estimation in Reverberant Environments by Jointing Detection and Modeling of Time-Frequency Points", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "379--392", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3042705", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3042705", abstract = "In this article, the direction of arrival (DOA) estimation of multiple speech sources in reverberant environments is 
investigated based on the recording of a soundfield microphone. First, the recordings are analyzed in the time-frequency (T-F) domain to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xue:2021:SEB, author = "Wei Xue and Alastair H. Moore and Mike Brookes and Patrick A. Naylor", title = "Speech Enhancement Based on Modulation-Domain Parametric Multichannel {Kalman} Filtering", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "393--405", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3040850", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3040850", abstract = "Recently we presented a modulation-domain multichannel Kalman filtering (MKF) algorithm for speech enhancement, which jointly exploits the inter-frame modulation-domain temporal evolution of speech and the inter-channel spatial correlation to estimate the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Song:2021:KGE, author = "Wei Song and Jingjin Guo and Ruiji Fu and Ting Liu and Lizhen Liu", title = "A Knowledge Graph Embedding Approach for Metaphor Processing", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "406--420", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3040507", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3040507", abstract = "Metaphor is a figure of speech that describes one thing (a target) by 
mentioning another thing (a source) in a way that is not literally true. Metaphor understanding is an interesting but challenging problem in natural language processing. This paper \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cheng:2021:ERF, author = "Longbiao Cheng and Xingwei Sun and Dingding Yao and Junfeng Li and Yonghong Yan", title = "Estimation Reliability Function Assisted Sound Source Localization With Enhanced Steering Vector Phase Difference", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "421--435", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3043107", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3043107", abstract = "The performance of the traditional direction-of-arrival (DOA) estimation algorithms greatly degrades in noisy and reverberant environments. Recently, deep learning has been applied to sound source localization and provided the substantial improvement in \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yu:2021:RAP, author = "Wangyang Yu and W. 
Bastiaan Kleijn", title = "Room Acoustical Parameter Estimation From Room Impulse Responses Using Deep Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "436--447", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3043115", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3043115", abstract = "We describe a new method to estimate the geometry of a room and reflection coefficients given room impulse responses. The method utilizes convolutional neural networks to estimate the room geometry and multilayer perceptrons to estimate the reflection \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ferrer:2021:APA, author = "Miguel Ferrer and Maria de Diego and Gema Pi{\~n}ero and Alberto Gonzalez", title = "Affine Projection Algorithm Over Acoustic Sensor Networks for Active Noise Control", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "448--461", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3042590", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3042590", abstract = "Acoustic sensor networks (ASNs) are an effective solution to implement active noise control (ANC) systems by using distributed adaptive algorithms. 
On one hand, ASNs provide scalable systems where the signal processing load is distributed among the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gossling:2021:PAE, author = "Nico G{\"o}{\ss}ling and Daniel Marquardt and Simon Doclo", title = "Performance Analysis of the Extended Binaural {MVDR} Beamformer With Partial Noise Estimation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "462--476", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3043674", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3043674", abstract = "Besides reducing undesired noise sources and limiting speech distortion, another important objective of a binaural noise reduction algorithm is the preservation of the binaural cues of all sound sources in the acoustic scene. 
In this paper, we consider \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gosztolya:2021:EBA, author = "G{\'a}bor Gosztolya and R{\'o}bert Busa-Fekete", title = "Ensemble Bag-of-Audio-Words Representation Improves Paralinguistic Classification Accuracy", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "477--488", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3044465", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3044465", abstract = "A recently introduced, effective feature extraction technique for computational paralinguistics is that of Bag-of-Audio-Words (BoAW), where we cluster the frame-level training vectors, and represent each speech utterance based on the cluster of its \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mertins:2021:RIR, author = "Alfred Mertins and Marco Maass and Fabrice Katzberg", title = "Room Impulse Response Reshaping and Crosstalk Cancellation Using Convex Optimization", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "489--502", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3044444", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3044444", abstract = "In this article, a new convex formulation for the acoustic channel-equalization problem is proposed and efficient ways for solving it are presented. 
Both the alternating direction method of multipliers and a proximal algorithm are studied for \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bai:2021:ITS, author = "Xuefeng Bai and Pengbo Liu and Yue Zhang", title = "Investigating Typed Syntactic Dependencies for Targeted Sentiment Classification Using Graph Attention Neural Network", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "503--514", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3042009", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3042009", abstract = "Targeted sentiment classification predicts the sentiment polarity on given target mentions in input texts. Dominant methods employ neural networks for encoding the input sentence and extracting relations between target mentions and their contexts. \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Borgstrom:2021:SEA, author = "Bengt J. Borgstr{\"o}m and Michael S. 
Brandstein",
  title = "{Speech Enhancement via Attention Masking Network (SEAMNET)}: an End-to-End System for Joint Suppression of Noise and Reverberation",
  journal = j-IEEE-ACM-TASLP,
  volume = "29",
  number = "??",
  pages = "515--526",
  month = jan,
  year = "2021",
  DOI = "https://doi.org/10.1109/TASLP.2020.3043655",
  bibdate = "Thu May 27 17:56:39 MDT 2021",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3043655",
  abstract = "This paper proposes the Speech Enhancement via Attention Masking Network (SEAMNET), a neural network-based end-to-end single-channel speech enhancement system designed for joint suppression of noise and reverberation. It formalizes an end-to-end network \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Miramont:2021:VJE: the abstract excerpt had been cut mid-word as
%%% `high-.' (hyphen plus stray period); the word is completed to
%%% `high-order', following the article title (`High-Order
%%% Synchrosqueezing Operators').

@Article{Miramont:2021:VJE,
  author = "Juan M. Miramont and Marcelo A. Colominas and Gast{\'o}n Schlotthauer",
  title = "Voice Jitter Estimation Using High-Order Synchrosqueezing Operators",
  journal = j-IEEE-ACM-TASLP,
  volume = "29",
  number = "??",
  pages = "527--536",
  month = jan,
  year = "2021",
  DOI = "https://doi.org/10.1109/TASLP.2020.3045265",
  bibdate = "Thu May 27 17:56:39 MDT 2021",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3045265",
  abstract = "Voice jitter is defined as a random perturbation of the glottal cycle duration which can be useful for voice parametrization and that usually depends on finding fiducial points in this signal. In this paper, a novel application of the Fourier-based high-order
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2021:SSU, author = "Peidong Wang and Zhuo Chen and DeLiang Wang and Jinyu Li and Yifan Gong", title = "Speaker Separation Using Speaker Inventories and Estimated Speech", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "537--546", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3045556", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3045556", abstract = "We propose speaker separation using speaker inventories and estimated speech (SSUSIES), a framework leveraging speaker profiles and estimated speech for speaker separation. SSUSIES contains two methods, speaker separation using speaker inventories (SSUSI) \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cumani:2021:DSV, author = "Sandro Cumani", title = "On the Distribution of Speaker Verification Scores: Generative Models for Unsupervised Calibration", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "547--562", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3040103", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3040103", abstract = "Speaker verification systems whose outputs can be interpreted as log-likelihood ratios (LLR) allow for cost-effective decisions by comparing the system outputs to application-defined thresholds depending only on prior information. 
Classifiers often \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chien:2021:AMV, author = "Yu-Ren Chien and J{\'o}n Gu{\eth}nason", title = "Acoustic Measure of Vocal Strain Based on Glottal Airflow Periodicity", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "563--574", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3044168", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3044168", abstract = "In the clinical practice of dysphonia, the effects of treatment are traditionally monitored by a sequence of auditory-perceptual assessments aimed at measuring vocal quality for the patient. Alternatively, acoustic measurement of vocal quality promises to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shen:2021:RRA, author = "Xingfa Shen and Xingkun Shao and Quanbo Ge and Lili Liu", title = "{RARS}: Recognition of Audio Recording Source Based on Residual Neural Network", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "575--584", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3039597", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3039597", abstract = "With the popularity of mobile devices and the emergence of various audio-editing tools, it becomes easier to produce and forge audio files. Many criminals will forge false audio information as evidence. 
Therefore, audio forensics technology becomes \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2021:LGE, author = "Gang Chen and Yang Liu and Huanbo Luan and Meng Zhang and Qun Liu and Maosong Sun", title = "Learning to Generate Explainable Plots for Neural Story Generation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "585--593", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3039606", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3039606", abstract = "Story generation is an important natural language processing task that aims to generate coherent stories automatically. While the use of neural networks has proven effective in improving story generation, how to learn to generate an explainable high-level \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2021:NCD, author = "Wenxing Yang and Jacob Benesty and Gongping Huang and Jingdong Chen", title = "A New Class of Differential Beamformers", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "594--606", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3045561", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3045561", abstract = "Differential microphone arrays (DMAs) have been used in a wide range of applications for high-fidelity acoustic signal acquisition and enhancement. 
In the design of differential beamformers, three of the widely used measures are the directivity factor (DF), \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Yang:2021:NCD (the entry ending just above): the truncated abstract
%%% announces three measures but names only the first; the period that
%%% preceded the ellipsis is now a comma, so the ellipsis reads as the
%%% continuation of that list.

@Article{Mitsufuji:2021:MBS,
  author = "Yuki Mitsufuji and Norihiro Takamune and Shoichi Koyama and Hiroshi Saruwatari",
  title = "Multichannel Blind Source Separation Based on Evanescent-Region-Aware Non-Negative Tensor Factorization in Spherical Harmonic Domain",
  journal = j-IEEE-ACM-TASLP,
  volume = "29",
  number = "??",
  pages = "607--617",
  month = jan,
  year = "2021",
  DOI = "https://doi.org/10.1109/TASLP.2020.3045528",
  bibdate = "Thu May 27 17:56:39 MDT 2021",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3045528",
  abstract = "There is growing interest in new audio formats in the context of virtual reality (VR), and higher-order ambisonics (HOA) is preferred for VR systems to transmit recorded scenes owing to its transmission efficiency and its flexibility to work with \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Fischer:2021:RCM,
  author = "D{\"o}rte Fischer and Simon Doclo",
  title = "Robust Constrained {MFMVDR} Filters for Single-Channel Speech Enhancement Based on Spherical Uncertainty Set",
  journal = j-IEEE-ACM-TASLP,
  volume = "29",
  number = "??",
  pages = "618--631",
  month = jan,
  year = "2021",
  DOI = "https://doi.org/10.1109/TASLP.2020.3042013",
  bibdate = "Thu May 27 17:56:39 MDT 2021",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3042013",
  abstract = "Aiming at exploiting speech
correlation across consecutive time-frames in the short-time Fourier transform domain, the multi-frame minimum variance distortionless response (MFMVDR) filter for single-channel speech enhancement has been proposed. The MFMVDR \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2021:DBB, author = "Xudong Zhao and Jacob Benesty and Jingdong Chen and Gongping Huang", title = "Differential Beamforming From the Beampattern Factorization Perspective", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "632--643", month = jan, year = "2021", DOI = "https://doi.org/10.1109/TASLP.2020.3046082", bibdate = "Thu May 27 17:56:39 MDT 2021", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3046082", abstract = "Differential beamformers have demonstrated a great potential in forming frequency-invariant beampatterns and achieving high directivity factors. 
Most conventional approaches design differential beamformers in such a way that their beampatterns resemble a \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Kawara:2021:PETa,
  author = "Yuki Kawara and Chenhui Chu and Yuki Arase",
  title = "Preordering Encoding on Transformer for Translation",
  journal = j-IEEE-ACM-TASLP,
  volume = "29",
  number = "??",
  pages = "644--655",
  month = jan,
  year = "2021",
  DOI = "https://doi.org/10.1109/TASLP.2020.3042001",
  bibdate = "Thu May 27 17:56:39 MDT 2021",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3042001",
  abstract = "The difference in word orders between source and target languages is a serious hurdle for machine translation. Preordering methods, which reorder the words in a source sentence before translation to obtain a similar word ordering with a target language, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2021:TCa,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "29",
  number = "??",
  pages = "c1--ix",
  year = "2021",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2021.3137064",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Thu Apr 7 10:27:19 2022",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2021:ISP,
  author = "Anonymous",
  title = "{IEEE Signal Processing Society}",
  journal = j-IEEE-ACM-TASLP,
  volume = "29",
  number = "??",
  pages = "c2--c2",
  year = "2021",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2020.3043180",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Thu Apr 7 10:27:19 2022",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Anonymous:2021:TCb,
  author = "Anonymous",
  title = "Table of Contents",
  journal = j-IEEE-ACM-TASLP,
  volume = "29",
  number = "??",
  pages = "x--xx",
  year = "2021",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2021.3137066",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Thu Apr 7 10:27:19 2022",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% NOTE: Kawara:2021:PETb describes the same article as Kawara:2021:PETa
%%% above (identical authors, title, pages, and DOI).  The key is kept so
%%% that documents already citing it still resolve; its month and URL are
%%% copied from Kawara:2021:PETa so both keys typeset and sort alike.
%%% Prefer Kawara:2021:PETa in new citations.

@Article{Kawara:2021:PETb,
  author = "Yuki Kawara and Chenhui Chu and Yuki Arase",
  title = "Preordering Encoding on Transformer for Translation",
  journal = j-IEEE-ACM-TASLP,
  volume = "29",
  number = "??",
  pages = "644--655",
  month = jan,
  year = "2021",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2020.3042001",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Thu Apr 7 10:27:19 2022",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2020.3042001",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Kameoka:2021:MMV,
  author = "Hirokazu Kameoka and Wen-Chin Huang and Kou Tanaka and Takuhiro Kaneko and Nobukatsu Hojo and Tomoki
Toda", title = "Many-to-Many Voice Transformer Network", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "656--670", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2020.3047262", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:SRM, author = "Jie Zhang and Huawei Chen and Li-Rong Dai and Richard Christian Hendriks", title = "A Study on Reference Microphone Selection for Multi-Microphone Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "671--683", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2020.3039930", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Politis:2021:OES, author = "Archontis Politis and Annamaria Mesaros and Sharath Adavanne and Toni Heittola and Tuomas Virtanen", title = "Overview and Evaluation of Sound Event Localization and Detection in {DCASE 2019}", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "684--698", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2020.3047233", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Niermann:2021:LEN, author = "Markus Niermann and Peter Vary", title = "Listening Enhancement in Noisy Environments: Solutions in Time and Frequency Domain", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "699--709", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2020.3047234", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lee:2021:GRC, author = "Hyeonseung Lee and Woo Hyun Kang and Sung Jun Cheon and Hyeongju Kim and Nam Soo Kim", title = "Gated Recurrent Context: Softmax-Free Attention for Online Encoder-Decoder Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "710--719", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3049344", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Vargas:2021:ITC, author = "Elizabeth Vargas and James R. 
Hopgood and Keith Brown and Kartic Subr", title = "On Improved Training of {CNN} for Acoustic Source Localisation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "720--732", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3049337", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cai:2021:DNS, author = "Yunqi Cai and Lantian Li and Andrew Abel and Xiaoyan Zhu and Dong Wang", title = "Deep Normalization for Speaker Vectors", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "733--744", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2020.3039573", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Huang:2021:PTS, author = "Wen-Chin Huang and Tomoki Hayashi and Yi-Chiao Wu and Hirokazu Kameoka and Tomoki Toda", title = "Pretraining Techniques for Sequence-to-Sequence Voice Conversion", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "745--755", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3049336", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jati:2021:TDW, author = "Arindam Jati and Amrutha Nadarajan and Raghuveer Peri and Karel Mundnich and Tiantian Feng and Benjamin Girault and Shrikanth Narayanan", title = "Temporal Dynamics of Workplace Acoustic Scenes: Egocentric Analysis and Prediction", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "756--769", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3050265", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Duan:2021:MFC, author = "Chaoqun Duan and Kehai Chen and Rui Wang and Masao Utiyama and Eiichiro Sumita and Conghui Zhu and Tiejun Zhao", title = "Modeling Future Cost for Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "770--781", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2020.3042006", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Munir:2021:ACS, author = "Kashif Munir and Hai Zhao and Zuchao Li", title = "Adaptive Convolution for Semantic Role Labeling", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "782--791", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2020.3048665", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu 
Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2021:QPP, author = "Yi-Chiao Wu and Tomoki Hayashi and Takuma Okamoto and Hisashi Kawai and Tomoki Toda", title = "Quasi-Periodic Parallel {WaveGAN}: a Non-Autoregressive Raw Waveform Generative Model With Pitch-Dependent Dilated Convolution Neural Network", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "792--806", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3051765", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yuan:2021:EMR, author = "Weitao Yuan and Bofei Dong and Shengbei Wang and Masashi Unoki and Wenwu Wang", title = "Evolving Multi-Resolution Pooling {CNN} for Monaural Singing Voice Separation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "807--822", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3051331", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shi:2021:GPS, author = "Liming Shi and Taewoong Lee and Lijun Zhang and Jesper Kj{\ae}r Nielsen and Mads Gr{\ae}sb{\o}ll 
Christensen", title = "Generation of Personal Sound Zones With Physical Meaningful Constraints and Conjugate Gradient Method", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "823--837", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3052564", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2021:RSB, author = "Xi Chen and Jacob Benesty and Gongping Huang and Jingdong Chen", title = "On the Robustness of the Superdirective Beamformer", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "838--849", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3053410", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2021:GIS, author = "Xinsheng Wang and Tingting Qiao and Jihua Zhu and Alan Hanjalic and Odette Scharenborg", title = "Generating Images From Spoken Descriptions", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "850--865", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3053391", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Balaraman:2021:DAD, author = "Vevake Balaraman and Bernardo Magnini", title = "Domain-Aware Dialogue State Tracker for Multi-Domain Dialogue Systems", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "866--873", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3054309", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2021:EBE, author = "Xixin Wu and Yuewen Cao and Hui Lu and Songxiang Liu and Shiyin Kang and Zhiyong Wu and Xunying Liu and Helen Meng", title = "Exemplar-Based Emotive Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "874--886", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3052688", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Dinkel:2021:TDR, author = "Heinrich Dinkel and Mengyue Wu and Kai Yu", title = "Towards Duration Robust Weakly Supervised Sound Event Detection", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "887--900", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3054313", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", 
acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ben-Hur:2021:BRB, author = "Zamir Ben-Hur and David Lou Alon and Ravish Mehra and Boaz Rafaely", title = "Binaural Reproduction Based on Bilateral Ambisonics and Ear-Aligned {HRTFs}", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "901--913", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3055038", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Aichinger:2021:SAS, author = "Philipp Aichinger and Franz Pernkopf", title = "Synthesis and Analysis-By-Synthesis of Modulated Diplophonic Glottal Area Waveforms", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "914--926", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3053387", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kelly:2021:ACL, author = "Finnian Kelly and John H. L. 
Hansen", title = "Analysis and Calibration of {Lombard} Effect and Whisper for Speaker Recognition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "927--942", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3053388", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Muller:2021:LDV, author = "Matthias M{\"u}ller and Thilo Schulz and Tatiana Ermakova and Philipp P. Caffier", title = "Lyric or Dramatic --- Vibrato Analysis for Voice Type Classification in Professional Opera Singers", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "943--955", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3054299", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rodriguez:2021:IWC, author = "Dem{\'o}stenes Z. Rodr{\'\i}guez and Dick Carrillo and Miguel A. Ram{\'\i}rez and Pedro H. J. 
Nardelli and Sebastian M{\"o}ller",
  title = "Incorporating Wireless Communication Parameters Into the {E-Model} Algorithm",
  journal = j-IEEE-ACM-TASLP,
  volume = "29",
  number = "??",
  pages = "956--968",
  year = "2021",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2021.3057955",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Thu Apr 7 10:27:19 2022",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% Rodriguez:2021:IWC (the entry ending just above): `E-Model' is a
%%% proper name, so it is brace-protected in the title to keep its
%%% capital letters under bibliography styles that downcase titles.

@Article{Zong:2021:NLE,
  author = "Tianrui Zong and Yong Xiang and Iynkaran Natgunanathan and Longxiang Gao and Guang Hua and Wanlei Zhou",
  title = "Non-Linear-Echo Based Anti-Collusion Mechanism for Audio Signals",
  journal = j-IEEE-ACM-TASLP,
  volume = "29",
  number = "??",
  pages = "969--984",
  year = "2021",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2021.3058892",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Thu Apr 7 10:27:19 2022",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Lian:2021:CCT,
  author = "Zheng Lian and Bin Liu and Jianhua Tao",
  title = "{CTNet}: Conversational Transformer Network for Emotion Recognition",
  journal = j-IEEE-ACM-TASLP,
  volume = "29",
  number = "??",
  pages = "985--1000",
  year = "2021",
  CODEN = "????",
  DOI = "https://doi.org/10.1109/TASLP.2021.3049898",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Thu Apr 7 10:27:19 2022",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:NMT, author = "Jiacheng Zhang and Huanbo Luan and Maosong Sun and Feifei Zhai and Jingfang Xu and Yang Liu", title = "Neural Machine Translation With Explicit Phrase Alignment", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1001--1010", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3057831", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Vukovic:2021:CLE, author = "Maria Vukovic and Melissa Stolar and Margaret Lech", title = "Cognitive Load Estimation From Speech Commands to Simulated Aircraft", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1011--1022", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3057492", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hu:2021:GCA, author = "De Hu and Zhe Chen and Fuliang Yin", title = "Geometry Calibration for Acoustic Transceiver Networks Based on Network {Newton} Distributed Optimization", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1023--1032", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3058539", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Saito:2021:PSA, author = "Yuki Saito and Shinnosuke Takamichi and Hiroshi Saruwatari", title = "Perceptual-Similarity-Aware Deep Speaker Representation Learning for Multi-Speaker Generative Modeling", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1033--1048", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3059114", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sakata:2021:VTL, author = "Tadashi Sakata and Naomitsu Ikeda and Yuichi Ueda and Akira Watanabe", title = "Vocal Tract Length Estimation Using Accumulated Means of Formants and Its Effects on Speaker-Normalization", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1049--1064", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3060172", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2021:MMP, author = "Jichen Yang and Hongji Wang and Rohan Kumar Das and Yanmin Qian", title = "Modified Magnitude-Phase Spectrum Information for Spoofing Detection", journal = j-IEEE-ACM-TASLP, 
volume = "29", number = "??", pages = "1065--1078", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3060810", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qian:2021:AVD, author = "Yanmin Qian and Zhengyang Chen and Shuai Wang", title = "Audio-Visual Deep Neural Network for Robust Person Verification", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1079--1092", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3057230", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2021:DSM, author = "Peiqin Lin and Meng Yang and Jianhuang Lai", title = "Deep Selective Memory Network With Selective Attention and Inter-Aspect Modeling for Aspect Level Sentiment Classification", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1093--1106", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3058540", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kamper:2021:IAW, author = "Herman 
Kamper and Yevgen Matusevych and Sharon Goldwater", title = "Improved Acoustic Word Embeddings for Zero-Resource Languages Using Multilingual Transfer", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1107--1118", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3060805", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2021:ABP, author = "Weiqing Wang and Jin Pan and Hua Yi and Zhanmei Song and Ming Li", title = "Audio-Based Piano Performance Evaluation for Beginners With Convolutional Neural Network and Attention Mechanism", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1119--1133", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3061267", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2021:QPW, author = "Yi-Chiao Wu and Tomoki Hayashi and Patrick Lumban Tobing and Kazuhiro Kobayashi and Tomoki Toda", title = "Quasi-Periodic {WaveNet}: an Autoregressive Raw Waveform Generative Model With Pitch-Dependent Dilated Convolution Neural Network", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1134--1148", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3061245", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Valimaki:2021:LRS, author = "Vesa V{\"a}lim{\"a}ki and Karolina Prawda", title = "Late-Reverberation Synthesis Using Interleaved Velvet-Noise Sequences", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1149--1160", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3060165", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:MTD, author = "Zhuosheng Zhang and Junlong Li and Hai Zhao", title = "Multi-Turn Dialogue Reading Comprehension With Pivot Turns and Knowledge", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1161--1173", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3058616", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gaultier:2021:SBA, author = "Cl{\'e}ment Gaultier and Sr{\dbar}an Kiti{\'c} and R{\'e}mi Gribonval and Nancy Bertin", title = "Sparsity-Based Audio Declipping Methods: Selected Overview, New Algorithms, and Large-Scale Evaluation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1174--1187", 
year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3059264", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Birnie:2021:MSS, author = "Lachlan Birnie and Thushara Abhayapala and Vladimir Tourbabin and Prasanga Samarasinghe", title = "Mixed Source Sound Field Translation for Virtual Binaural Application With Perceptual Validation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1188--1203", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3061939", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pal:2021:MLL, author = "Monisankha Pal and Manoj Kumar and Raghuveer Peri and Tae Jin Park and So Hyun Kim and Catherine Lord and Somer Bishop and Shrikanth Narayanan", title = "Meta-Learning With Latent Space Clustering in Generative Adversarial Network for Speaker Diarization", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1204--1219", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3061885", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:SSR, author = "Jie Zhang and Jun Du and Li-Rong Dai", title = "Sensor Selection for Relative Acoustic Transfer Function Steered Linearly-Constrained Beamformers", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1220--1232", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3064399", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xie:2021:ZSA, author = "Huang Xie and Tuomas Virtanen", title = "Zero-Shot Audio Classification Via Semantic Embeddings", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1233--1242", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3065234", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2021:PUS, author = "Xianhong Chen and Changchun Bao", title = "Phoneme-Unit-Specific Time-Delay Neural Network for Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1243--1255", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3065202", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, 
Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shi:2021:OOC, author = "Dongyuan Shi and Woon-Seng Gan and Bhan Lam and Shulin Wen and Xiaoyi Shen", title = "Optimal Output-Constrained Active Noise Control Based on Inverse Adaptive Modeling Leak Factor Estimate", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1256--1269", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3065730", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pandey:2021:DCS, author = "Ashutosh Pandey and DeLiang Wang", title = "Dense {CNN} With Self-Attention for Time-Domain Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1270--1279", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3064421", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qin:2021:KWL, author = "Libo Qin and Wanxiang Che and Minheng Ni and Yangming Li and Ting Liu", title = "Knowing Where to Leverage: Context-Aware Graph Convolutional Network With an Adaptive Fusion Layer for Contextual Spoken Language Understanding", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1280--1289", year = "2021", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2021.3053400", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:TLS, author = "Mingyang Zhang and Yi Zhou and Li Zhao and Haizhou Li", title = "Transfer Learning From Speech Synthesis to Voice Conversion With Non-Parallel Training Data", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1290--1302", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3066047", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{He:2021:NNA, author = "Weipeng He and Petr Motlicek and Jean-Marc Odobez", title = "Neural Network Adaptation and Data Augmentation for Multi-Speaker Direction-of-Arrival Estimation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1303--1317", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3060257", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2021:ISG, author = "Yile Wang and Leyang Cui and Yue Zhang", title = "Improving Skip-Gram Embeddings 
Using {BERT}", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1318--1328", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3065201", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2021:DGB, author = "Linzhi Wu and Meishan Zhang", title = "Deep Graph-Based Character-Level {Chinese} Dependency Parsing", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1329--1339", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3067212", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bai:2021:IKE, author = "Ye Bai and Jiangyan Yi and Jianhua Tao and Zhengqi Wen and Zhengkun Tian and Shuai Zhang", title = "Integrating Knowledge Into End-to-End Speech Recognition From External Text-Only Data", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1340--1351", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3066274", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
@Article{Cho:2021:CML, author = "Byung Joon Cho and Hyung-Min Park", title = "Convolutional Maximum-Likelihood Distortionless Response Beamforming With Steering Vector Estimation for Robust Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1352--1367", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3067202", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Michelsanti:2021:ODL, author = "Daniel Michelsanti and Zheng-Hua Tan and Shi-Xiong Zhang and Yong Xu and Meng Yu and Dong Yu and Jesper Jensen", title = "An Overview of Deep-Learning-Based Audio-Visual Speech Enhancement and Separation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1368--1396", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3066303", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Itzhak:2021:DDK, author = "Gal Itzhak and Jacob Benesty and Israel Cohen", title = "On the Design of Differential {Kronecker} Product Beamformers", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1397--1410", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3069089", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ge:2021:PMP, author = "Zhongshu Ge and Liang Li and Tianshu Qu", title = "Partially Matching Projection Decoding Method Evaluation Under Different Playback Conditions", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1411--1423", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3068002", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mai:2021:AMS, author = "Sijie Mai and Songlong Xing and Haifeng Hu", title = "Analyzing Multimodal Sentiment Via Acoustic- and Visual-{LSTM} With Channel-Aware Temporal Convolution Network", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1424--1437", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3068598", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qian:2021:JMN, author = "Tao Qian and Meishan Zhang and Yinxia Lou and Daiwen Hua", title = "A Joint Model for Named Entity Recognition With Sentence-Level Entity Type Attentions", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = 
"1438--1448", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3069295", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sato:2021:ASP, author = "Ryotaro Sato and Kenta Niwa and Kazunori Kobayashi", title = "Ambisonic Signal Processing {DNNs} Guaranteeing Rotation, Scale and Time Translation Equivariance", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1449--1462", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3069193", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Park:2021:IEL, author = "Sooyeon Park and Jung-Woo Choi", title = "Iterative Echo Labeling Algorithm With Convex Hull Expansion for Room Geometry Estimation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1463--1478", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3069093", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hogg:2021:OSS, author = "Aidan O. T. Hogg and Christine Evers and Alastair H. 
Moore and Patrick A. Naylor", title = "Overlapping Speaker Segmentation Using Multiple Hypothesis Tracking of Fundamental Frequency", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1479--1490", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3067161", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sharma:2021:CEA, author = "Rajib Sharma and Israel Cohen and Baruch Berdugo", title = "Controlling Elevation and Azimuth Beamwidths With Concentric Circular Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1491--1502", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3072275", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2021:MIE, author = "Run-Ze Wang and Zhen-Hua Ling and Jing-Bo Zhou and Yu Hu", title = "A Multiple-Integration Encoder for Multi-Turn Text-to-{SQL} Semantic Parsing", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1503--1513", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3070726", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", 
journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hu:2021:BLL, author = "Shoukang Hu and Xurong Xie and Shansong Liu and Jianwei Yu and Zi Ye and Mengzhe Geng and Xunying Liu and Helen Meng", title = "{Bayesian} Learning of {LF-MMI} Trained Time Delay Neural Networks for Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1514--1529", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3069080", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Torcoli:2021:OMP, author = "Matteo Torcoli and Thorsten Kastner and J{\"u}rgen Herre", title = "Objective Measures of Perceptual Audio Quality Reviewed: an Evaluation of Their Application Domain Dependence", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1530--1541", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3069302", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Dinkel:2021:VAD, author = "Heinrich Dinkel and Shuai Wang and Xuenan Xu and Mengyue Wu and Kai Yu", title = "Voice Activity Detection in the Wild: a Data-Driven Approach Using Teacher-Student Training", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1542--1555", year = "2021", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2021.3073596", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2021:DMS, author = "Songbin Li and Jingang Wang and Peng Liu and Miao Wei and Qiandong Yan", title = "Detection of Multiple Steganography Methods in Compressed Speech Based on Code Element Embedding, {Bi-LSTM} and {CNN} With Attention Mechanisms", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1556--1569", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3074752", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ma:2021:DSA, author = "Qianli Ma and Jiangyue Yan and Zhenxi Lin and Liuhong Yu and Zipeng Chen", title = "Deformable Self-Attention for Text Classification", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1570--1581", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3067210", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:EPW, author = "Ya-Jie Zhang and Zhen-Hua Ling", title = 
"Extracting and Predicting Word-Level Style Variations for Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1582--1593", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3074757", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bohlender:2021:ETC, author = "Alexander Bohlender and Ann Spriet and Wouter Tirry and Nilesh Madhu", title = "Exploiting Temporal Context in {CNN} Based Multisource {DOA} Estimation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1594--1608", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3067113", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yatabe:2021:DBB, author = "Kohei Yatabe and Daichi Kitamura", title = "Determined {BSS} Based on Time-Frequency Masking and Its Application to Harmonic Vector Analysis", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1609--1625", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3073863", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yoon:2021:TTF, author = "Ji Won Yoon and Hyeonseung Lee and Hyung Yong Kim and Won Ik Cho and Nam Soo Kim", title = "{TutorNet}: Towards Flexible Knowledge Distillation for End-to-End Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1626--1638", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3071662", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Singh:2021:SSR, author = "Prachi Singh and Sriram Ganapathy", title = "Self-Supervised Representation Learning With Path Integral Clustering for Speaker Diarization", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1639--1649", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3075100", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wei:2021:GSL, author = "Penghui Wei and Jiahao Zhao and Wenji Mao", title = "A Graph-to-Sequence Learning Framework for Summarizing Opinionated Texts", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1650--1660", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3071667", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Levin:2021:NFS, author = "Dovid Y. Levin and Shmulik Markovich-Golan and Sharon Gannot", title = "Near-Field Superdirectivity: an Analytical Perspective", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1661--1674", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3070686", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hsu:2021:SER, author = "Jia-Hao Hsu and Ming-Hsiang Su and Chung-Hsien Wu and Yi-Hsuan Chen", title = "Speech Emotion Recognition Considering Nonverbal Vocalization in Affective Conversations", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1675--1686", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3076364", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nakamura:2021:TDA, author = "Tomohiko Nakamura and Shihori Kozuka and Hiroshi Saruwatari", title = "Time-Domain Audio Source Separation With Neural Networks Based on Multiresolution Analysis", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = 
"1687--1701", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3072496", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:FFS, author = "Yun Zhang and Yongguo Liu and Jiajing Zhu and Xindong Wu", title = "{FSPRM}: a Feature Subsequence Based Probability Representation Model for {Chinese} Word Embedding", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1702--1716", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3073868", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2021:MVC, author = "Songxiang Liu and Yuewen Cao and Disong Wang and Xixin Wu and Xunying Liu and Helen Meng", title = "Any-to-Many Voice Conversion With Location-Relative Sequence-to-Sequence Modeling", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1717--1728", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3076867", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chiea:2021:OEB, author = 
"Rafael A. Chiea and M{\'a}rcio H. Costa and J{\'u}lio A. Cordioli", title = "An Optimal Envelope-Based Noise Reduction Method for Cochlear Implants: an Upper Bound Performance Investigation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1729--1739", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3076363", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Guo:2021:AAE, author = "Junliang Guo and Zhirui Zhang and Linli Xu and Boxing Chen and Enhong Chen", title = "Adaptive Adapters: an Efficient Way to Incorporate {BERT} Into Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1740--1751", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3076863", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Luo:2021:GCC, author = "Yi Luo and Cong Han and Nima Mesgarani", title = "Group Communication With Context Codec for Lightweight Source Separation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1752--1761", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3078640", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash 
ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xie:2021:HNP, author = "Zhiwen Xie and Runjie Zhu and Jin Liu and Guangyou Zhou and Jimmy Xiangji Huang", title = "Hierarchical Neighbor Propagation With Bidirectional Graph Attention Network for Relation Prediction", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1762--1773", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3079812", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2021:BCM, author = "Xuehan Wang and Jacob Benesty and Jingdong Chen and Gongping Huang and Israel Cohen", title = "Beamforming with Cube Microphone Arrays Via {Kronecker} Product Decompositions", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1774--1784", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3079816", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tan:2021:TMC, author = "Ke Tan and DeLiang Wang", title = "Towards Model Compression for Deep Learning Based Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1785--1794", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3082282", ISSN = 
"2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tesch:2021:NSF, author = "Kristina Tesch and Timo Gerkmann", title = "Nonlinear Spatial Filtering in Multichannel Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1795--1805", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3076372", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2021:ETT, author = "Rui Liu and Berrak Sisman and Guanglai Gao and Haizhou Li", title = "Expressive {TTS} Training With Frame and Style Reconstruction Loss", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1806--1818", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3076369", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qiang:2021:CLS, author = "Jipeng Qiang and Xinyu Lu and Yun Li and Yunhao Yuan and Xindong Wu", title = "{Chinese} Lexical Simplification", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1819--1828", year = "2021", 
CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3078361", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2021:THB, author = "Andong Li and Wenzhe Liu and Chengshi Zheng and Cunhang Fan and Xiaodong Li", title = "Two Heads are Better Than One: a Two-Stage Complex Spectral Mapping Approach for Monaural Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1829--1843", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3079813", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hamdan:2021:WOV, author = "Eric C. 
Hamdan and Filippo Maria Fazi", title = "Weighted Orthogonal Vector Rejection Method for Loudspeaker-Based Binaural Audio Reproduction", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1844--1852", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3080915", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tan:2021:DLB, author = "Ke Tan and Xueliang Zhang and DeLiang Wang", title = "Deep Learning Based Real-Time Speech Enhancement for Dual-Microphone Mobile Phones", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1853--1863", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3082318", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{SongGong:2021:IMS, author = "Kunkun SongGong and Huawei Chen and Wenwu Wang", title = "Indoor Multi-Speaker Localization Based on {Bayesian} Nonparametrics in the Circular Harmonic Domain", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1864--1880", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3079809", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language 
Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chinaev:2021:DCC, author = "Aleksej Chinaev and Philipp Th{\"u}ne and Gerald Enzner", title = "Double-Cross-Correlation Processing for Blind Sampling-Rate and Time-Offset Estimation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1881--1896", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3071967", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bai:2021:FEE, author = "Ye Bai and Jiangyan Yi and Jianhua Tao and Zhengkun Tian and Zhengqi Wen and Shuai Zhang", title = "Fast End-to-End Speech Recognition Via Non-Autoregressive Models and Cross-Modal Knowledge Transferring From {BERT}", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1897--1911", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3082299", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kose:2021:MRS, author = "{\"O}yk{\"u} Deniz K{\"o}se and Murat Sara{\c{c}}lar", title = "Multimodal Representations for Synchronized Speech and Real-Time {MRI} Video Processing", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1912--1924", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3084099", ISSN 
= "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Narendra:2021:DPD, author = "N. P. Narendra and Bj{\"o}rn Schuller and Paavo Alku", title = "The Detection of {Parkinson}'s Disease From Speech Using Voice Source Information", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1925--1936", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3078364", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rehr:2021:SBF, author = "Robert Rehr and Timo Gerkmann", title = "{SNR-Based} Features and Diverse Training Data for Robust {DNN-Based} Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1937--1949", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3082702", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ito:2021:JDB, author = "Nobutaka Ito and Rintaro Ikeshita and Hiroshi Sawada and Tomohiro Nakatani", title = "A Joint Diagonalization Based Efficient Approach to Underdetermined Blind Audio 
Source Separation Using the Multichannel {Wiener} Filter", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1950--1965", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3079815", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fei:2021:SOS, author = "Hao Fei and Shengqiong Wu and Yafeng Ren and Donghong Ji", title = "Second-Order Semantic Role Labeling With Global Structural Refinement", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1966--1976", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3082706", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Torres:2021:FPD, author = "Humberto M. Torres and Mercedes G{\"u}emes and Jorge A. Gurlekian and Diego A. 
Evin", title = "{F0} Perturbation Due to Articulatory Movements: Filtering, Characterization and Applications", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1977--1986", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3082671", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Koutini:2021:RFR, author = "Khaled Koutini and Hamid Eghbal-zadeh and Gerhard Widmer", title = "Receptive Field Regularization Techniques for Audio Classification and Tagging With Deep Convolutional Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "1987--2000", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3082307", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2021:MMC, author = "Zhong-Qiu Wang and Peidong Wang and DeLiang Wang", title = "Multi-microphone Complex Spectral Mapping for Utterance-wise and Continuous Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2001--2014", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3083405", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, 
and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2021:RED, author = "Mengjia Zhou and Donghong Ji and Fei Li", title = "Relation Extraction in Dialogues: a Deep Learning Model Based on the Generality and Specialty of Dialogue Text", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2015--2026", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3082295", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nguyen:2021:DSC, author = "Minh Nguyen and Gia H. Ngo and Nancy F. Chen", title = "Domain-Shift Conditioning Using Adaptable Filtering Via Hierarchical Embeddings for Robust {Chinese} Spell Check", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2027--2036", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3083108", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib; https://www.math.utah.edu/pub/tex/bib/spell.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Madmoni:2021:EPT, author = "Lior Madmoni and Shir Tibor and Israel Nelken and Boaz Rafaely", title = "The Effect of Partial Time-Frequency Masking of the Direct Sound on the Perception of Reverberant Speech", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2037--2047", year = "2021", CODEN = "????", DOI 
= "https://doi.org/10.1109/TASLP.2021.3084742", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2021:CAG, author = "Haibin Chen and Qianli Ma and Liuhong Yu and Zhenxi Lin and Jiangyue Yan", title = "Corpus-Aware Graph Aggregation Network for Sequence Labeling", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2048--2057", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3084105", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2021:TRS, author = "Heming Wang and DeLiang Wang", title = "Towards Robust Speech Super-Resolution", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2058--2066", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3054302", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yu:2021:AVM, author = "Jianwei Yu and Shi-Xiong Zhang and Bo Wu and Shansong Liu and Shoukang Hu and Mengzhe Geng and Xunying Liu and Helen Meng and Dong Yu", title = "Audio-Visual Multi-Channel 
Integration and Recognition of Overlapped Speech", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2067--2082", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3078883", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Slizovskaia:2021:CSS, author = "Olga Slizovskaia and Gloria Haro and Emilia G{\'o}mez", title = "Conditioned Source Separation for Musical Instrument Performances", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2083--2095", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3082331", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xie:2021:BLD, author = "Xurong Xie and Xunying Liu and Tan Lee and Lan Wang", title = "{Bayesian} Learning for Deep Neural Network Adaptation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2096--2110", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3084072", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
@Article{Bhattacharjee:2021:NKP, author = "Sankha Subhra Bhattacharjee and Nithin V. George", title = "Nearest {Kronecker} Product Decomposition Based Linear-in-The-Parameters Nonlinear Filters", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2111--2122", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3084755", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2021:MAC, author = "Canguang Li and Guohua Wang and Jin Cao and Yi Cai", title = "A Multi-Agent Communication Based Model for Nested Named Entity Recognition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2123--2136", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3086978", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ong:2021:BSM, author = "Jonah Ong and Ba Tuong Vo and Sven Nordholm", title = "Blind Separation for Multiple Moving Sources With Labeled Random Finite Sets", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2137--2151", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3087003", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, 
Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Su:2021:PSD, author = "Yixuan Su and Yan Wang and Deng Cai and Simon Baker and Anna Korhonen and Nigel Collier", title = "{PROTOTYPE-TO-STYLE}: Dialogue Generation With Style-Aware Editing on Retrieval Memory", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2152--2161", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3087948", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bernardini:2021:WDN, author = "Alberto Bernardini and Enrico Bozzo and Federico Fontana and Augusto Sarti", title = "A Wave Digital {Newton--Raphson} Method for Virtual Analog Modeling of Audio Circuits with Multiple One-Port Nonlinearities", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2162--2173", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3084337", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Guo:2021:PNS, author = "Gang Guo and Yi Yu and Rodrigo C. 
de Lamare and Zongsheng Zheng and Lu Lu and Qiangming Cai", title = "Proximal Normalized Subband Adaptive Filtering for Acoustic Echo Cancellation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2174--2188", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3087951", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liski:2021:AGD, author = "Juho Liski and Aki M{\"a}kivirta and Vesa V{\"a}lim{\"a}ki", title = "Audibility of Group-Delay Equalization", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2189--2201", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3087969", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mim:2021:CAB, author = "Farjana Sultana Mim and Naoya Inoue and Paul Reisert and Hiroki Ouchi and Kentaro Inui", title = "Corruption Is Not All Bad: Incorporating Discourse Structure Into Pre-Training via Corruption for Essay Scoring", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2202--2215", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3088223", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on 
Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kipnis:2021:GBC, author = "Dror Kipnis and Roee Diamant", title = "Graph-Based Clustering of Dolphin Whistles", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2216--2227", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3091813", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2021:LIA, author = "Yuanyuan Liu and Nelly Penttil{\"a} and Tiina Ihalainen and Juulia Lintula and Rachel Convey and Okko R{\"a}s{\"a}nen", title = "Language-Independent Approach for Automatic Computation of Vowel Articulation Features in Dysarthric Speech Assessment", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2228--2243", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3090973", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Medina:2021:IND, author = "C. Medina and R. Coelho and L. 
Z{\~a}o", title = "Impulsive Noise Detection for Speech Enhancement in {HHT} Domain", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2244--2253", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3093392", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lopez-Espejo:2021:NLF, author = "Iv{\'a}n L{\'o}pez-Espejo and Zheng-Hua Tan and Jesper Jensen", title = "A Novel Loss Function and Training Strategy for Noise-Robust Keyword Spotting", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2254--2266", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3092567", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2021:RPC, author = "Shansong Liu and Mengzhe Geng and Shoukang Hu and Xurong Xie and Mingyu Cui and Jianwei Yu and Xunying Liu and Helen Meng", title = "Recent Progress in the {CUHK} Dysarthric Speech Recognition System", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2267--2281", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3091805", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and 
Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2021:DAR, author = "Juan Zhao and Tianrui Zong and Yong Xiang and Longxiang Gao and Wanlei Zhou and Gleb Beliakov", title = "Desynchronization Attacks Resilient Watermarking Method Based on Frequency Singular Value Coefficient Modification", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2282--2295", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3092555", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Coteli:2021:SRL, author = "Mert Burkay {\c{C}}{\"o}teli and H{\"u}seyin Hac{\i}habibo{\u{g}}lu", title = "Sparse Representations With {Legendre} Kernels for {DOA} Estimation and Acoustic Source Separation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2296--2309", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3091845", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Furnon:2021:DBM, author = "Nicolas Furnon and Romain Serizel and Slim Essid and Irina Illina", title = "{DNN}-Based Mask Estimation for Distributed Speech Enhancement in Spatially Unconstrained Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2310--2323", year = "2021", 
CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3092838", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anidjar:2021:HST, author = "Or Haim Anidjar and Itshak Lapidot and Chen Hajaj and Amit Dvir and Issachar Gilad", title = "Hybrid Speech and Text Analysis Methods for Speaker Change Detection", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2324--2338", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3093817", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fan:2021:MTS, author = "Chuang Fan and Chaofa Yuan and Lin Gui and Yue Zhang and Ruifeng Xu", title = "Multi-Task Sequence Tagging for Emotion-Cause Pair Extraction Via Tag Distribution Refinement", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2339--2350", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3089837", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2021:TSS, author = "Andy T. 
Liu and Shang-Wen Li and Hung-yi Lee", title = "{TERA}: Self-Supervised Learning of Transformer Encoder Representation for Speech", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2351--2366", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3095662", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2021:CFA, author = "Guanlong Zhao and Shaojin Ding and Ricardo Gutierrez-Osuna", title = "Converting Foreign Accent Speech Without a Reference", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2367--2381", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3060813", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schulze-Forster:2021:PLL, author = "Kilian Schulze-Forster and Clement S. J. 
Doire and Ga{\"e}l Richard and Roland Badeau", title = "Phoneme Level Lyrics Alignment and Text-Informed Singing Voice Separation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2382--2395", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3091817", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2021:HOP, author = "Shengqiong Wu and Hao Fei and Yafeng Ren and Bobo Li and Fei Li and Donghong Ji", title = "High-Order Pair-Wise Aspect and Opinion Terms Extraction With Edge-Enhanced Syntactic Graph Convolution", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2396--2406", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3095672", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2021:STS, author = "Jingyi Wu and Lin Shang and Xiaoying Gao", title = "Sentiment Time Series Calibration for Event Detection", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2407--2420", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3096653", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", 
journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Munir:2021:LCA, author = "Kashif Munir and Hai Zhao and Zuchao Li", title = "Learning Context-Aware Convolutional Filters for Implicit Discourse Relation Classification", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2421--2433", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3096041", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kim:2021:ESI, author = "Seokhwan Kim and Hannes Schulz and Chulaka Gunasekara and Chiori Hori and Abhinav Rastogi and Luis Fernando D'Haro", title = "Editorial: Special Issue on the Eighth Dialog System Technology Challenge", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2434--2436", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3097842", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kim:2021:RWN, author = "Byoungjae Kim and Jungyun Seo and Myoung-Wan Koo", title = "Randomly Wired Network Based on {RoBERTa} and Dialog History Attention for Response Selection", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2437--2442", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3077119", ISSN = "2329-9290", ISSN-L = "2329-9290",
bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gu:2021:DCU, author = "Jia-Chen Gu and Tianda Li and Zhen-Hua Ling and Quan Liu and Zhiming Su and Yu-Ping Ruan and Xiaodan Zhu", title = "Deep Contextualized Utterance Representations for Response Selection and Dialogue Analysis", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2443--2455", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3074788", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chu:2021:EER, author = "Yun-Wei Chu and Kuan-Yen Lin and Chao-Chun Hsu and Lun-Wei Ku", title = "End-to-End Recurrent Cross-Modality Attention for Video Dialogue", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2456--2464", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3065852", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2021:CSR, author = "Kun Xu and Han Wu and Linfeng Song and Haisong Zhang and Linqi Song and Dong Yu", title = "Conversational Semantic Role Labeling", journal = 
j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2465--2475", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3074014", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2021:BTV, author = "Zekang Li and Zongjia Li and Jinchao Zhang and Yang Feng and Jie Zhou", title = "Bridging Text and Video: a Universal Multimodal Transformer for Audio-Visual Scene-Aware Dialog", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2476--2483", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3065823", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shalyminov:2021:GGR, author = "Igor Shalyminov and Alessandro Sordoni and Adam Atkinson and Hannes Schulz", title = "{GRTr}: Generative-Retrieval Transformers for Data-Efficient Dialogue Domain Adaptation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2484--2492", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3074779", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zeng:2021:DAM, author = "Jiali Zeng and Yongjing Yin and Yang Liu and Yubin Ge and Jinsong Su", title = "Domain Adaptive Meta-Learning for Dialogue State Tracking", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2493--2501", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3080182", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:DSH, author = "Chen Zhang and Grandee Lee and Luis Fernando D'Haro and Haizhou Li", title = "{D-Score}: Holistic Dialogue Evaluation Without Reference", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2502--2516", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3074012", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Malviya:2021:HHD, author = "Shrikant Malviya and Rohit Mishra and Santosh Kumar Barnwal and Uma Shanker Tiwary", title = "{HDRS}: {Hindi} Dialogue Restaurant Search Corpus for Dialogue State Tracking in Task-Oriented Environment", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2517--2528", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3065833", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource =
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kim:2021:OED, author = "Seokhwan Kim and Michel Galley and Chulaka Gunasekara and Sungjin Lee and Adam Atkinson and Baolin Peng and Hannes Schulz and Jianfeng Gao and Jinchao Li and Mahmoud Adada and Minlie Huang and Luis Lastras and Jonathan K. Kummerfeld and Walter S. Lasecki and Chiori Hori and Anoop Cherian and Tim K. Marks and Abhinav Rastogi and Xiaoxue Zang and Srinivas Sunkara and Raghav Gupta", title = "Overview of the {Eighth Dialog System Technology Challenge: DSTC8}", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2529--2540", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3078368", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jeong:2021:LCA, author = "Myeongho Jeong and Seungtaek Choi and Jinyoung Yeo and Seung-won Hwang", title = "Label and Context Augmentation for Response Selection at {DSTC8}", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2541--2550", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3076876", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2021:HRB, author = "Qing Liu and Lei Chen and Yuan Yuan and Huarui Wu", title = "History Reuse and Bag-of-Words Loss for Long Summary Generation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2551--2560", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3100281", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:PPE, author = "Lu Zhang and Mingjiang Wang and Qiquan Zhang and Xinsheng Wang and Ming Liu", title = "{PhaseDCN}: a Phase-Enhanced Dual-Path Dilated Convolutional Network for Single-Channel Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2561--2574", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3092585", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Haque:2021:GGA, author = "Kazi Nazmul Haque and Rajib Rana and Jiajun Liu and John H. L. Hansen and Nicholas Cummins and Carlos Busso and Bj{\"o}rn W. 
Schuller", title = "Guided Generative Adversarial Neural Network for Representation Learning and Audio Generation Using Fewer Labelled Audio Data", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2575--2590", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3098764", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nakashika:2021:GBM, author = "Toru Nakashika and Kohei Yatabe", title = "Gamma {Boltzmann} Machine for Audio Modeling", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2591--2605", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3095656", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2021:AFN, author = "Xintong Li and Lemao Liu and Zhaopeng Tu and Guanlin Li and Shuming Shi and Max Q.-H. 
Meng", title = "Attending From Foresight: a Novel Attention Mechanism for Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2606--2616", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3097939", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2021:IFA, author = "Hengshun Zhou and Jun Du and Yuanyuan Zhang and Qing Wang and Qing-Feng Liu and Chin-Hui Lee", title = "Information Fusion in Attention Networks Using Adaptive and Multi-Level Factorized Bilinear Pooling for Audio-Visual Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2617--2629", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3096037", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2021:LCL, author = "Yuling Li and Kui Yu and Yuhong Zhang", title = "Learning Cross-Lingual Mappings in Imperfectly Isomorphic Embedding Spaces", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2630--2642", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3097935", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on 
Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2021:USS, author = "Xiao Zhou and Zhen-Hua Ling and Li-Rong Dai", title = "{UnitNet}: a Sequence-to-Sequence Acoustic Model for Concatenative Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2643--2655", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3093823", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pan:2021:MTP, author = "Zihan Pan and Malu Zhang and Jibin Wu and Jiadong Wang and Haizhou Li", title = "Multi-Tone Phase Coding of Interaural Time Difference for Sound Source Localization With Spiking Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2656--2670", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3100684", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{OHanlon:2021:FSC, author = "Ken O'Hanlon and Mark B.
Sandler", title = "{FifthNet}: Structured Compact Neural Networks for Automatic Chord Recognition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2671--2682", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3070158", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Spagnol:2021:ESN, author = "Simone Spagnol and Riccardo Miccini and Marius George Onofrei and Runar Unnthorsson and Stefania Serafin", title = "Estimation of Spectral Notches From Pinna Meshes: Insights From a Simple Computational Model", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2683--2695", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3101928", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2021:TSV, author = "Chenglin Xu and Wei Rao and Jibin Wu and Haizhou Li", title = "Target Speaker Verification With Selective Auditory Attention for Single and Multi-Talker Speech", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2696--2709", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3100682", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on 
Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zahedi:2021:MPB, author = "Adel Zahedi and Michael Syskind Pedersen and Jan {\O}stergaard and Thomas Ulrich Christiansen and Lars Bramsl{\o}w and Jesper Jensen", title = "Minimum Processing Beamforming", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2710--2724", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3053411", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2021:MIN, author = "Xianghui Wang and Jie Chen and Xiaoyi Chen and Jing Guo and Qian Xiang", title = "Multichannel Iterative Noise Reduction Filters in the Short-Time-{Fourier}-Transform Domain Based on {Kronecker} Product Decomposition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2725--2740", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3092825", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yin:2021:RQG, author = "Kai-Li Yin and Yi-Fei Pu and Lu Lu", title = "Robust {Q}-Gradient Subband Adaptive Filter for Nonlinear Active Noise Control", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2741--2752", year = "2021", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2021.3102193", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Byun:2021:MSS, author = "Jaeuk Byun and Jong Won Shin", title = "Monaural Speech Separation Using Speaker Embedding From Preliminary Separation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2753--2763", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3101617", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2021:DSB, author = "Xudong Zhao and Gongping Huang and Jingdong Chen and Jacob Benesty", title = "On the Design of {3D} Steerable Beamformers With Uniform Concentric Circular Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2764--2778", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3103129", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cheng:2021:UTO, author = "Zifeng Cheng and Zhiwei Jiang and Yafeng Yin and Na Li and Qing Gu", title = "A Unified Target-Oriented 
Sequence-to-Sequence Model for Emotion-Cause Pair Extraction", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2779--2791", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3102194", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Azadi:2021:RVF, author = "Hamid Azadi and Mohammad-R. Akbarzadeh-T and Hamid-R. Kobravi and Ali Shoeibi", title = "Robust Voice Feature Selection Using Interval Type-2 Fuzzy {AHP} for Automated Diagnosis of {Parkinson}'s Disease", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2792--2802", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3097215", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hono:2021:SDN, author = "Yukiya Hono and Kei Hashimoto and Keiichiro Oura and Yoshihiko Nankaku and Keiichi Tokuda", title = "Sinsy: a Deep Neural Network-Based Singing Voice Synthesis System", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2803--2815", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3104165", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language 
Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tang:2021:MGS, author = "Jian Tang and Jie Zhang and Yan Song and Ian McLoughlin and Li-Rong Dai", title = "Multi-Granularity Sequence Alignment Mapping for Encoder-Decoder Based End-to-End {ASR}", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2816--2828", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3101921", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Leong:2021:ETM, author = "Chongman Leong and Xuebo Liu and Derek F. Wong and Lidia S. Chao", title = "Exploiting Translation Model for Parallel Corpus Mining", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2829--2839", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3105798", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zeghidour:2021:WEE, author = "Neil Zeghidour and David Grangier", title = "{Wavesplit}: End-to-End Speech Separation by Speaker Clustering", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2840--2849", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3099291", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Oglic:2021:LWB, author = "Dino Oglic and Zoran Cvetkovic and Peter Sollich", title = "Learning Waveform-Based Acoustic Models Using Deep Variational Convolutional Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2850--2863", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3104193", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nelus:2021:PPA, author = "Alexandru Nelus and Rainer Martin", title = "Privacy-Preserving Audio Classification Using Variational Information Feature Extraction", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2864--2877", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3108063", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2021:RNN, author = "Hao Li and DeLiang Wang and Xueliang Zhang and Guanglai Gao", title = "Recurrent Neural Networks and Acoustic Features for Frame-Level Signal-to-Noise Ratio Estimation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2878--2887", 
year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3107617", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2021:GRG, author = "Yi Zhou and Xiaoqing Zheng and Xuanjing Huang", title = "Generating Responses With a Given Syntactic Pattern in {Chinese} Dialogues", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2888--2898", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3110124", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gunnarsson:2021:BAM, author = "Viktor Gunnarsson and Mikael Sternad", title = "Binaural Auralization of Microphone Array Room Impulse Responses Using Causal {Wiener} Filtering", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2899--2914", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3110340", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2021:SIT, author = "Zuolong Chen and Huawei Chen and Quansheng Tu", title = "Sensor Imperfection 
Tolerance Analysis of Robust Linear Differential Microphone Arrays", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2915--2929", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3110136", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Su:2021:CLC, author = "Yusheng Su and Xu Han and Yankai Lin and Zhengyan Zhang and Zhiyuan Liu and Peng Li and Jie Zhou and Maosong Sun", title = "{CSS-LM}: a Contrastive Framework for Semi-Supervised Fine-Tuning of Pre-Trained Language Models", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2930--2941", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3105013", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kabzinski:2021:CCF, author = "Tobias Kabzinski and Peter Jax", title = "A Causality-Constrained Frequency-Domain Least-Squares Filter Design Method for Crosstalk Cancellation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2942--2956", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3110651", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language 
Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zalkow:2021:CBL, author = "Frank Zalkow and Meinard M{\"u}ller", title = "{CTC}-Based Learning of Chroma Features for Score Audio Music Retrieval", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2957--2971", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3110137", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chan:2021:MBC, author = "Teck Kai Chan and Cheng Siong Chin", title = "Multi-Branch Convolutional Macaron Net for Sound Event Detection", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2972--2985", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3110649", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kourkounakis:2021:FEE, author = "Tedd Kourkounakis and Amirhossein Hajavi and Ali Etemad", title = "{FluentNet}: End-to-End Detection of Stuttered Speech Disfluencies With Deep Learning", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "2986--2999", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3110146", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2021:MMO, author = "Haoyu Li and Junichi Yamagishi", title = "Multi-Metric Optimization Using Generative Adversarial Networks for Near-End Speech Intelligibility Enhancement", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3000--3011", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3111566", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2021:PTD, author = "Zehao Lin and Shaobo Cui and Guodun Li and Xiaoming Kang and Feng Ji and Fenglin Li and Zhongzhou Zhao and Haiqing Chen and Yin Zhang", title = "Predict-Then-Decide: a Predictive Approach for Wait or Answer Task in Dialogue Systems", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3012--3024", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3110145", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Calis:2021:LBE, author = "Metin Calis and Steven van de Par and Richard Heusdens and Richard Christian Hendriks", title = "Localization Based on Enhanced Low Frequency Interaural 
Level Difference", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3025--3039", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3111583", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liberatore:2021:NNV, author = "Christopher Liberatore", title = "Native-Nonnative Voice Conversion by Residual Warping in a Sparse, Anchor-Based Representation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3040--3051", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3111568", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Koyama:2021:SAN, author = "Shoichi Koyama and Jesper Brunnstr{\"o}m and Hayato Ito and Natsuki Ueno and Hiroshi Saruwatari", title = "Spatial Active Noise Control Based on Kernel Interpolation of Sound Field", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3052--3063", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3107983", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qiang:2021:LLS, author = "Jipeng Qiang and Yun Li and Yi Zhu and Yunhao Yuan and Yang Shi and Xindong Wu", title = "{LSBert}: Lexical Simplification Based on {BERT}", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3064--3076", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3111589", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:CIE, author = "Ningyu Zhang and Hongbin Ye and Shumin Deng and Chuanqi Tan and Mosha Chen and Songfang Huang and Fei Huang and Huajun Chen", title = "Contrastive Information Extraction With Generative Transformer", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3077--3088", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3110126", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2021:MVM, author = "Jianyu Wang and Shanzheng Guan and Shupei Liu and Xiao-Lei Zhang", title = "Minimum-Volume Multichannel Nonnegative Matrix Factorization for Blind Audio Source Separation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3089--3103", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120603", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 
2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Carini:2021:RIR, author = "Alberto Carini and Stefania Cecchi and Alessandro Terenzi and Simone Orcioni", title = "A Room Impulse Response Measurement Method Robust Towards Nonlinearities Based on Orthogonal Periodic Sequences", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3104--3117", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120595", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:QAB, author = "Jie Zhang and Changheng Li", title = "Quantization-Aware Binaural {MWF} Based Noise Reduction Incorporating External Wireless Devices", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3118--3131", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120639", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhu:2021:KEF, author = "Biru Zhu and Xingyao Zhang and Ming Gu and Yangdong Deng", title = "Knowledge Enhanced Fact Checking and Verification", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", 
pages = "3132--3143", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120636", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Poletti:2021:STM, author = "Mark A. Poletti and Paul D. Teal", title = "A Superfast {Toeplitz} Matrix Inversion Method for Single- and Multi-Channel Inverse Filters and Its Application to Room Equalization", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3144--3157", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120650", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2021:DSC, author = "Guanlin Li and Lemao Liu and Conghui Zhu and Rui Wang and Tiejun Zhao and Shuming Shi", title = "Detecting Source Contextual Barriers for Understanding Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3158--3169", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3085119", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
@Article{Kuo:2021:AAS, author = "Chia-Chih Kuo and Kuan-Yu Chen and Shang-Bao Luo", title = "Audio-Aware Spoken Multiple-Choice Question Answering With Pre-Trained Language Models", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3170--3179", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120638", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2021:AEG, author = "Rui Liu and Zheng Lin and Weiping Wang", title = "Addressing Extraction and Generation Separately: Keyphrase Prediction With Pre-Trained Language Models", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3180--3191", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120587", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2021:SDC, author = "Jiangnan Li and Hongliang Pan and Zheng Lin and Peng Fu and Weiping Wang", title = "Sarcasm Detection with Commonsense Knowledge", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3192--3201", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120601", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, 
Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2021:KSU, author = "Runyan Yang and Gaofeng Cheng and Haoran Miao and Ta Li and Pengyuan Zhang and Yonghong Yan", title = "Keyword Search Using Attention-Based End-to-End {ASR} and Frame-Synchronous Phoneme Alignments", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3202--3215", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120632", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Alkhaldi:2021:FFS, author = "Tareq Alkhaldi and Chenhui Chu and Sadao Kurohashi", title = "Flexibly Focusing on Supporting Facts, Using Bridge Links, and Jointly Training Specialized Modules for Multi-Hop Question Answering", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3216--3225", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120643", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2021:EFB, author = "Wenyi Wu and Yegui Xiao and Jianhui Lin and Liying Ma and Khashayar Khorasani", title = "An Efficient Filter Bank Structure for Adaptive Notch Filtering and Applications", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3226--3241", year = "2021", CODEN = 
"????", DOI = "https://doi.org/10.1109/TASLP.2021.3120600", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2021:SSD, author = "Xinsheng Wang and Justin van der Hout and Jihua Zhu and Mark Hasegawa-Johnson and Odette Scharenborg", title = "Synthesizing Spoken Descriptions of Images", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3242--3254", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120644", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Neo:2021:ENR, author = "Vincent W. Neo and Christine Evers and Patrick A. 
Naylor", title = "Enhancement of Noisy Reverberant Speech Using Polynomial Matrix Eigenvalue Decomposition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3255--3266", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120630", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Giampiccolo:2021:WDM, author = "Riccardo Giampiccolo and Mauro Giuseppe de Bari and Alberto Bernardini and Augusto Sarti", title = "Wave Digital Modeling and Implementation of Nonlinear Audio Circuits With Nullors", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3267--3279", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120627", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2021:SER, author = "Xixin Wu and Yuewen Cao and Hui Lu and Songxiang Liu and Disong Wang and Zhiyong Wu and Xunying Liu and Helen Meng", title = "Speech Emotion Recognition Using Sequential Capsule Networks", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3280--3291", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120586", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM 
Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gong:2021:PIA, author = "Yuan Gong and Yu-An Chung and James Glass", title = "{PSLA}: Improving Audio Tagging With Pretraining, Sampling, Labeling, and Aggregation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3292--3306", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120633", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:RAC, author = "Licheng Zhang and Zhendong Mao and Benfeng Xu and Quan Wang and Yongdong Zhang", title = "Review and Arrange: Curriculum Learning for Natural Language Understanding", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3307--3320", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3121986", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{He:2021:ADA, author = "Fei He and Ling He and Jing Zhang and Yuanyuan Li and Xi Xiong", title = "Automatic Detection of Affective Flattening in Schizophrenia: Acoustic Correlates to Sound Waves and Auditory Perception", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3321--3334", year = "2021", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2021.3120591", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bouzid:2021:ELA, author = "Saoussen Mathlouthi Bouzid and Chiraz Ben Othmane Zribi", title = "Efficient Learning Approach for Pronominal Anaphora and Ellipsis Identification and Resolution in {Arabic} Texts", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3335--3348", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120649", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yuksel:2021:SCD, author = "Arda Y{\"u}ksel and Berke U{\u{g}}urlu and Aykut Ko{\c{c}}", title = "Semantic Change Detection With {Gaussian} Word Embeddings", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3349--3361", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120645", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2021:MTS, author = "Mei Li and Lu Xiang and Xiaomian Kang and Yang Zhao and Yu Zhou and Chengqing Zong", 
title = "Medical Term and Status Generation From {Chinese} Clinical Dialogue With Multi-Granularity Transformer", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3362--3374", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3122301", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2021:NRG, author = "Yongwei Li and Jianhua Tao and Donna Erickson and Bin Liu and Masato Akagi", title = "{$ F_0 $}-Noise-Robust Glottal Source and Vocal Tract Analysis Based on {ARX-LF} Model", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3375--3383", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120585", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liao:2021:EES, author = "Xianwen Liao and Yongzhong Huang and Yongzhuang Wei and Chenhao Zhang and Fu Wang and Yong Wang", title = "Efficient Estimate of Sentence's Representation Based on the Difference Semantics Model", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3384--3399", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3123885", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM 
Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jeon:2021:TNT, author = "Kwang Myung Jeon and Geon Woo Lee and Nam Kyun Kim and Hong Kook Kim", title = "{TAU-Net}: Temporal Activation {$U$}-Net Shared With Nonnegative Matrix Factorization for Speech Enhancement in Unseen Noise Environments", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3400--3414", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3067154", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ding:2021:RSS, author = "Yi-Yang Ding and Hao-Jian Lin and Li-Juan Liu and Zhen-Hua Ling and Yu Hu", title = "Robustness of Speech Spoofing Detectors Against Adversarial Post-Processing of Voice Conversion", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3415--3426", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3124420", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2021:LAS, author = "Yi Zhou and Xiaohai Tian and Haizhou Li", title = "Language Agnostic Speaker Embedding for Cross-Lingual Personalized Speech Generation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3427--3439", year = "2021", CODEN = "????", 
DOI = "https://doi.org/10.1109/TASLP.2021.3125142", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2021:SEU, author = "Ju Lin and Adriaan J. de Lind van Wijngaarden and Kuang-Ching Wang and Melissa C. Smith", title = "Speech Enhancement Using Multi-Stage Self-Attentive Temporal Convolutional Networks", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3440--3450", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3125143", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hsu:2021:HSS, author = "Wei-Ning Hsu and Benjamin Bolte and Yao-Hung Hubert Tsai and Kushal Lakhotia and Ruslan Salakhutdinov and Abdelrahman Mohamed", title = "{HuBERT}: Self-Supervised Speech Representation Learning by Masked Prediction of Hidden Units", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3451--3460", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3122291", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
@Article{Yamaoka:2021:TFW, author = "Kouei Yamaoka and Nobutaka Ono and Shoji Makino", title = "Time-Frequency-Bin-Wise Linear Combination of Beamformers for Distortionless Signal Enhancement", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3461--3475", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3126950", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2021:CPM, author = "Zhong-Qiu Wang and Gordon Wichern and Jonathan {Le Roux}", title = "Convolutive Prediction for Monaural Speech Dereverberation and Noisy-Reverberant Speaker Separation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3476--3490", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3129363", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2021:LDD, author = "Bing Yang and Hong Liu and Xiaofei Li", title = "Learning Deep Direct-Path Relative Transfer Function for Binaural Sound Source Localization", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3491--3503", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120641", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = 
"IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cui:2021:PTW, author = "Yiming Cui and Wanxiang Che and Ting Liu and Bing Qin and Ziqing Yang", title = "Pre-Training With Whole Word Masking for {Chinese} {BERT}", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3504--3514", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3124365", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sar:2021:CFA, author = "Leda Sar{\i} and Mark Hasegawa-Johnson and Chang D. Yoo", title = "Counterfactually Fair Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3515--3525", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3126949", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:MCM, author = "Zhuohuang Zhang and Yong Xu and Meng Yu and Shi-Xiong Zhang and Lianwu Chen and Donald S. 
Williamson and Dong Yu", title = "Multi-Channel Multi-Frame {ADL-MVDR} for Target Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3526--3540", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3129335", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Westhausen:2021:RSL, author = "Nils L. Westhausen and Rainer Huber and Hannah Baumgartner and Ragini Sinha and Jan Rennies and Bernd T. Meyer", title = "Reduction of Subjective Listening Effort for {TV} Broadcast Signals With Recurrent Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3541--3550", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3126931", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sasaki:2021:SBC, author = "Shota Sasaki and Jun Suzuki and Kentaro Inui", title = "Subword-Based Compact Reconstruction for Open-Vocabulary Neural Word Embeddings", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3551--3564", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3125133", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on 
Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cui:2021:ADD, author = "Xiaodong Cui and Wei Zhang and Abdullah Kayi and Mingrui Liu and Ulrich Finkler and Brian Kingsbury and George Saon and David Kung", title = "Asynchronous Decentralized Distributed Training of Acoustic Models", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3565--3576", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3122349", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2021:SAN, author = "Junqing Zhang and Wen Zhang and Jihui Aimee Zhang and Thushara Dheemantha Abhayapala and Lijun Zhang", title = "Spatial Active Noise Control in Rooms Using Higher Order Sources", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3577--3591", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3126936", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2021:MER, author = "Bingzhi Chen and Qi Cao and Mixiao Hou and Zheng Zhang and Guangming Lu and David Zhang", title = "Multimodal Emotion Recognition With Temporal and Semantic Consistency", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3592--3603", year = "2021", CODEN = 
"????", DOI = "https://doi.org/10.1109/TASLP.2021.3129331", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Supraja:2021:RPB, author = "S. Supraja and Andy W. H. Khong and S. Tatinati", title = "Regularized Phrase-Based Topic Model for Automatic Question Classification With Domain-Agnostic Class Labels", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3604--3616", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3126937", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Maeda:2021:SFR, author = "Natsuko Maeda and Filippo Maria Fazi and Falk-Martin Hoffmann", title = "Sound Field Reproduction With a Cylindrical Loudspeaker Array Using First Order Wall Reflections", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3617--3630", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120590", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lu:2021:CGM, author = "Xugang Lu and Peng Shen and Yu Tsao and 
Hisashi Kawai", title = "Coupling a Generative Model With a Discriminative Learning Framework for Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3631--3641", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3129360", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Helmholz:2021:EAN, author = "Hannes Helmholz and David Lou Alon and Sebasti{\`a} V. Amengual Gar{\'\i} and Jens Ahrens", title = "Effects of Additive Noise in Binaural Rendering of Spherical Microphone Array Signals", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3642--3653", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3129359", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hong:2021:SRR, author = "Joanna Hong and Minsu Kim and Se Jin Park and Yong Man Ro", title = "Speech Reconstruction With Reminiscent Sound Via Visual Voice Memory", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3654--3667", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3126925", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and 
Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Weisman:2021:RAR, author = "Ran Weisman and Tom Shlomo and Vladimir Tourbabin and Paul Calamia and Boaz Rafaely", title = "Robustness of Acoustic Rake Filters in Minimum Variance Beamforming", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3668--3678", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3126946", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2021:MPL, author = "Junhao Xu and Jianwei Yu and Shoukang Hu and Xunying Liu and Helen Meng", title = "Mixed Precision Low-Bit Quantization of Neural Network Language Models for Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3679--3693", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3129357", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ge:2021:LFG, author = "Jidong Ge and Yunyun Huang and Xiaoyu Shen and Chuanyi Li and Wei Hu", title = "Learning Fine-Grained Fact-Article Correspondence in Legal Cases", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3694--3706", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3130992", ISSN = "2329-9290", ISSN-L = 
"2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kong:2021:HRP, author = "Qiuqiang Kong and Bochen Li and Xuchen Song and Yuan Wan and Yuxuan Wang", title = "High-Resolution Piano Transcription With Pedals by Regressing Onset and Offset Times", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3707--3717", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3121991", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2021:IIA, author = "Anonymous", title = "{2021 Index \booktitle{IEEE/ACM Transactions on Audio, Speech, and Language Processing Vol. 
29}}", journal = j-IEEE-ACM-TASLP, volume = "29", number = "??", pages = "3718--3760", year = "2021", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3147096", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Anonymous:2022:ISP, author = "Anonymous", title = "{IEEE Signal Processing Society}", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "C2--C2", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3137075", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2022:RRO, author = "Qianying Liu and Wenyu Guan and Sujian Li and Fei Cheng and Daisuke Kawahara and Sadao Kurohashi", title = "{RODA}: Reverse Operation Based Data Augmentation for Solving Math Word Problems", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1--11", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3126932", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhen:2022:SEN, author = "Kai Zhen and Jongmo Sung and Mi Suk 
Lee and Seungkwon Beack and Minje Kim", title = "Scalable and Efficient Neural Speech Coding: a Hybrid Design", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "12--25", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3129353", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2022:TGD, author = "Sen Yang and Yang Liu and Dawei Feng and Dongsheng Li", title = "Text Generation From Data With Dynamic Planning", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "26--34", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3129346", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liebich:2022:OEC, author = "Stefan Liebich and Peter Vary", title = "Occlusion Effect Cancellation in Headphones and Hearing Devices --- The Sister of Active Noise Cancellation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "35--48", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3130966", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp;
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2022:WAK, author = "Zhuosheng Zhang and Haojie Yu and Hai Zhao and Masao Utiyama", title = "Which Apple Keeps Which Doctor Away? {Colorful} Word Representations With Visual Oracles", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "49--59", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3130972", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2022:MSD, author = "Zhenyu Wang and John H. L. Hansen", title = "Multi-Source Domain Adaptation for Text-Independent Forensic Speaker Recognition", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "60--75", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3130975", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zheng:2022:UCE, author = "Kengtao Zheng and Nankai Lin and Shengyi Jiang", title = "Unsupervised Character Embedding Correction and Candidate Word Denoising", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "76--86", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3129334", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, 
fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ma:2022:EDS, author = "Bing Ma and Haifeng Sun and Jingyu Wang and Qi Qi and Jianxin Liao", title = "Extractive Dialogue Summarization Without Annotation Based on Distantly Supervised Machine Reading Comprehension in Customer Service", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "87--97", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3133206", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2022:ECO, author = "Shengcai Liu and Ning Lu and Cheng Chen and Ke Tang", title = "Efficient Combinatorial Optimization for Word-Level Adversarial Textual Attack", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "98--111", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3130970", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Terenzi:2022:CFE, author = "Alessandro Terenzi and Nicola Ortolani and In{\^e}s Nolasco and Emmanouil Benetos and Stefania Cecchi", title = "Comparison of Feature Extraction Methods for Sound-Based Classification of Honey Bee Activity", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = 
"112--122", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3133194", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mao:2022:ESB, author = "Shuiyang Mao and P. C. Ching and Tan Lee", title = "Enhancing Segment-Based Speech Emotion Recognition by Iterative Self-Learning", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "123--134", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3133195", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shahrebabaki:2022:AAM, author = "Abdolreza Sabzi Shahrebabaki and Giampiero Salvi and Torbj{\o}rn Svendsen and Sabato Marco Siniscalchi", title = "Acoustic-to-Articulatory Mapping With Joint Optimization of Deep Speech Enhancement and Articulatory Inversion Models", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "135--147", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3133218", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } 
@Article{Jorge:2022:LSS, author = "Javier Jorge and Adri{\`a} Gim{\'e}nez and Joan Albert Silvestre-Cerd{\`a} and Jorge Civera and Albert Sanchis and Alfons Juan", title = "Live Streaming Speech Recognition Using Deep Bidirectional {LSTM} Acoustic Models and Interpolated Language Models", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "148--161", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3133216", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shifas:2022:EEN, author = "Muhammed P. V. Shifas and C{\u{a}}t{\u{a}}lin Zoril{\u{a}} and Yannis Stylianou", title = "End-to-End Neural Based Modification of Noisy Speech for Speech-in-Noise Intelligibility Improvement", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "162--173", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3126947", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2022:VWV, author = "Joon-Young Yang and Joon-Hyuk Chang", title = "{VACE-WPE}: Virtual Acoustic Channel Expansion Based on Neural Networks for Weighted Prediction Error-Based Speech Dereverberation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "174--189", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3133190", ISSN = "2329-9290", ISSN-L = 
"2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Du:2022:PLP, author = "Chenpeng Du and Kai Yu", title = "Phone-Level Prosody Modelling With {GMM}-Based {MDN} for Diverse and Controllable Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "190--201", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3133205", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2022:IAR, author = "Haibin Wu and Xu Li and Andy T. 
Liu and Zhiyong Wu and Helen Meng and Hung-Yi Lee", title = "Improving the Adversarial Robustness for Speaker Verification by Self-Supervised Learning", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "202--217", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3133189", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hou:2022:MVS, author = "Mixiao Hou and Zheng Zhang and Qi Cao and David Zhang and Guangming Lu", title = "Multi-View Speech Emotion Recognition Via Collective Relation Construction", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "218--229", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3133196", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2022:LPR, author = "Da-rong Liu and Po-chun Hsu and Yi-chen Chen and Sung-feng Huang and Shun-po Chuang and Da-yi Wu and Hung-yi Lee", title = "Learning Phone Recognition From Unpaired Audio and Phone Sequences Based on Generative Adversarial Network", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "230--243", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138720", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", 
acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2022:WRA, author = "Yuting Zhao and Mamoru Komachi and Tomoyuki Kajiwara and Chenhui Chu", title = "Word-Region Alignment-Guided Multimodal Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "244--259", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138719", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2022:SAM, author = "Zhuosheng Zhang and Yiqing Zhang and Hai Zhao", title = "Syntax-Aware Multi-Spans Generation for Reading Comprehension", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "260--268", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138679", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhu:2022:DRC, author = "Pengfei Zhu and Zhuosheng Zhang and Hai Zhao and Xiaoguang Li", title = "{DUMA}: Reading Comprehension With Transposition Thinking", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "269--279", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138683", ISSN = "2329-9290", ISSN-L = 
"2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xie:2022:DDG, author = "Jiayuan Xie and Ningxin Peng and Yi Cai and Tao Wang and Qingbao Huang", title = "Diverse Distractor Generation for Constructing High-Quality Multiple Choice Questions", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "280--291", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138706", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2022:PUB, author = "Jie Zhang and Guanghui Zhang", title = "A Parametric Unconstrained Beamformer Based Binaural Noise Reduction for Assistive Hearing", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "292--304", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138675", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Turchet:2022:MER, author = "Luca Turchet and Johan Pauwels", title = "Music Emotion Recognition: Intention of Composers-Performers Versus Perception of Musicians, Non-Musicians, and Listening Machines", 
journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "305--316", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138709", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hou:2022:EAC, author = "Wenxin Hou and Han Zhu and Yidong Wang and Jindong Wang and Tao Qin and Renjun Xu and Takahiro Shinozaki", title = "Exploiting Adapters for Cross-Lingual Low-Resource Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "317--329", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138674", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2022:IPT, author = "Kehai Chen and Rui Wang and Masao Utiyama and Eiichiro Sumita", title = "Integrating Prior Translation Knowledge Into Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "330--339", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138714", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Deng:2022:AAL, author = "Keqi Deng and Gaofeng Cheng and Runyan Yang and Yonghong Yan", title = "Alleviating {ASR} Long-Tailed Problem by Decoupling the Learning of Representation and Classification", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "340--354", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138707", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2022:HIJ, author = "Zuchao Li and Junru Zhou and Hai Zhao and Kevin Parnow", title = "{HPSG}-Inspired Joint Neural Constituent and Dependency Parsing in {$ O(n^3) $} Time Complexity", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "355--366", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138715", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shi:2022:USR, author = "Xuan Shi and Erica Cooper and Junichi Yamagishi", title = "Use of Speaker Recognition Approaches for Learning and Evaluating Embedding Representations of Musical Instrument Sounds", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "367--377", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3140549", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", 
bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yao:2022:SRS, author = "Zengwei Yao and Wenjie Pei and Fanglin Chen and Guangming Lu and David Zhang", title = "Stepwise-Refining Speech Separation Network via Fine-Grained Encoding in High-Order Latent Domain", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "378--393", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3140556", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qian:2022:ODU, author = "Yanmin Qian and Zhikai Zhou", title = "Optimizing Data Usage for Low-Resource Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "394--403", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3140552", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mary:2022:VTS, author = "Narla John Metilda Sagaya Mary and Srinivasan Umesh and Sandesh Varadaraju Katta", title = "{S}-Vectors and {TESA}: Speaker Embeddings and a Speaker Authenticator Based on Transformer Encoder", journal = j-IEEE-ACM-TASLP, volume = "30", number = 
"??", pages = "404--413", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3134566", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Borgstrom:2022:BEP, author = "Bengt J. Borgstr{\"o}m", title = "{Bayesian} Estimation of {PLDA} in the Presence of Noisy Training Labels, With Applications to Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "414--428", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3130980", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lu:2022:SFR, author = "Menglong Lu and Zhen Huang and Binyang Li and Yunxiang Zhao and Zheng Qin and DongSheng Li", title = "{SIFTER}: a Framework for Robust Rumor Detection", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "429--442", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3140474", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2022:PSE, author = "Lantian Li and Dong Wang and Jiawen 
Kang and Renyu Wang and Jing Wu and Zhendong Gao and Xiao Chen", title = "A Principle Solution for Enroll-Test Mismatch in Speaker Recognition", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "443--455", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3140558", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2022:ADL, author = "Feiran Yang", title = "Analysis of Deficient-Length Partitioned-Block Frequency-Domain Adaptive Filters", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "456--467", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138671", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jiang:2022:ASE, author = "Hui Jiang and Linfeng Song and Yubin Ge and Fandong Meng and Junfeng Yao and Jinsong Su", title = "An {AST} Structure Enhanced Decoder for Code Generation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "468--476", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138717", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kanervisto:2022:OTS, author = "Anssi Kanervisto and Ville Hautam{\"a}ki and Tomi Kinnunen and Junichi Yamagishi", title = "Optimizing Tandem Speaker Verification and Anti-Spoofing Systems", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "477--488", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138681", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ni:2022:FUN, author = "Xin Ni and Jia Ren", title = "{FC-U2-Net}: a Novel Deep Neural Network for Singing Voice Separation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "489--494", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3140561", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zeghidour:2022:SEE, author = "Neil Zeghidour and Alejandro Luebs and Ahmed Omran and Jan Skoglund and Marco Tagliasacchi", title = "{SoundStream}: an End-to-End Neural Audio Codec", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "495--507", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3129994", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Manamperi:2022:DAS, author = "Wageesha Manamperi and Thushara D. Abhayapala and Jihui Zhang and Prasanga N. Samarasinghe", title = "Drone Audition: Sound Source Localization Using On-Board Microphones", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "508--519", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3140550", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2022:RLB, author = "Qian Li and Hao Peng and Jianxin Li and Jia Wu and Yuanxing Ning and Lihong Wang and Philip S. 
Yu and Zheng Wang", title = "Reinforcement Learning-Based Dialogue Guided Event Extraction to Exploit Argument Relations", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "520--533", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138670", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ruiz:2022:DCA, author = "Santiago Ruiz and Toon van Waterschoot and Marc Moonen", title = "Distributed Combined Acoustic Echo Cancellation and Noise Reduction in Wireless Acoustic Sensor and Actuator Networks", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "534--547", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3140548", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Grinewitschus:2022:HSA, author = "Lukas Grinewitschus and Peter Jung", title = "The Harmonic Shift Algorithm for Efficient Multi-Pitch Detection", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "548--561", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3129344", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", 
journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lu:2022:EMS, author = "Ziyao Lu and Xiang Li and Yang Liu and Chulun Zhou and Jianwei Cui and Bin Wang and Min Zhang and Jinsong Su", title = "Exploring Multi-Stage Information Interactions for Multi-Source Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "562--570", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3120592", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2022:CJM, author = "Jingxuan Yang and Si Li and Sheng Gao and Jun Guo", title = "{CorefDPR}: a Joint Model for Coreference Resolution and Dropped Pronoun Recovery in {Chinese} Conversations", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "571--581", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3140545", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Atalay:2022:SDN, author = "Timu{\c{c}}in Berk Atalay and Z{\"u}hre S{\"u} G{\"u}l and Enzo {De Sena} and Zoran Cvetkovi{\'c} and H{\"u}seyin Hac{\i}habibo{\u{g}}lu", title = "Scattering Delay Network Simulator of Coupled Volume Acoustics", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "582--593", year = "2022", CODEN = "????", DOI = 
"https://doi.org/10.1109/TASLP.2022.3143697", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2022:AKL, author = "Yi Zhang and Lei Li and Yunfang Wu and Qi Su and Xu Sun", title = "Alleviating the Knowledge-Language Inconsistency: a Study for Deep Commonsense Knowledge", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "594--604", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138721", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tan:2022:NSF, author = "Ke Tan and Zhong-Qiu Wang and DeLiang Wang", title = "Neural Spectrospatial Filtering", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "605--621", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145319", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mao:2022:APT, author = "Qianren Mao and Jianxin Li and Chenghua Lin and Congwen Chen and Hao Peng and Lihong Wang and Philip S. 
Yu", title = "Adaptive Pre-Training and Collaborative Fine-Tuning: a Win-Win Strategy to Improve Review Analysis Tasks", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "622--634", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3140482", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cheng:2022:LCO, author = "Zifeng Cheng and Zhiwei Jiang and Yafeng Yin and Cong Wang and Qing Gu", title = "Learning to Classify Open Intent via Soft Labeling and Manifold Mixup", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "635--645", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145308", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{An:2022:DSS, author = "Xiaochun An and Frank K. 
Soong and Lei Xie", title = "Disentangling Style and Speaker Attributes for {TTS} Style Transfer", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "646--658", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145297", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2022:RED, author = "Zhuang Chen and Tieyun Qian", title = "Retrieve-and-Edit Domain Adaptation for {End2End} Aspect Based Sentiment Analysis", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "659--672", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3146052", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2022:CDS, author = "Jian Liu and Mengshi Yu and Yufeng Chen and Jinan Xu", title = "Cross-Domain Slot Filling as Machine Reading Comprehension: a New Perspective", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "673--685", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3140559", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2022:SSS, author = "Yongkang Liu and Qingbao Huang and Jing Li and Linzhang Mo and Yi Cai and Qing Li", title = "{SSAP}: Storylines and Sentiment Aware Pre-Trained Model for Story Ending Generation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "686--694", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145320", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2022:MCI, author = "Ying Zhou and Xuefeng Liang and Yu Gu and Yifei Yin and Longshan Yao", title = "Multi-Classifier Interactive Learning for Ambiguous Speech Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "695--705", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145287", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hoang:2022:MSE, author = "Poul Hoang and Jan Mark de Haan and Zheng-Hua Tan and Jesper Jensen", title = "Multichannel Speech Enhancement With Own Voice-Based Interfering Speech Suppression for Hearing Assistive Devices", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "706--720", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145294", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 
10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yu:2022:DDR, author = "Weijie Yu and Chen Xu and Jun Xu and Liang Pang and Ji-Rong Wen", title = "Distribution Distance Regularized Sequence Representation for Text Matching in Asymmetrical Domains", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "721--733", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145289", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2022:NCA, author = "Heming Wang and DeLiang Wang", title = "Neural Cascade Architecture With Triple-Domain Loss for Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "734--743", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138716", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{DeLucia:2022:GDE, author = "Riccardo R. 
{De Lucia} and Antonio Canclini and Fabio Antonacci and Augusto Sarti", title = "Group Dictionary Equivalent Source Method for Sparse Nearfield Acoustic Holography", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "744--757", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145316", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ma:2022:RNF, author = "Tong Ma and Ying Wei and Xin Lou", title = "Reconfigurable Nonuniform Filter Bank for Hearing Aid Systems", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "758--771", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3138713", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mingote:2022:ALF, author = "Victoria Mingote and Antonio Miguel and Dayana Ribas and Alfonso Ortega and Eduardo Lleida", title = "{aDCF} Loss Function for Deep Metric Learning in End-to-End Text-Dependent Speaker Verification Systems", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "772--784", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145307", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions 
on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tu:2022:TLB, author = "Quansheng Tu and Huawei Chen", title = "Theoretical Lower Bounds on the Performance of the First-Order Differential Microphone Arrays With Sensor Imperfections", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "785--801", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145317", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2022:CTF, author = "Taihui Wang and Feiran Yang and Jun Yang", title = "Convolutive Transfer Function-Based Multichannel Nonnegative Matrix Factorization for Overdetermined Blind Source Separation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "802--815", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145304", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2022:HLH, author = "Yi Zhang and Guangyou Zhou and Zhiwen Xie and Jimmy Xiangji Huang", title = "{HGEN}: Learning Hierarchical Heterogeneous Graph Encoding for Math Word Problem Solving", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "816--828", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145314", 
ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fonseca:2022:FOD, author = "Eduardo Fonseca and Xavier Favory and Jordi Pons and Frederic Font and Xavier Serra", title = "{FSD50K}: an Open Dataset of Human-Labeled Sound Events", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "829--852", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3133208", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lei:2022:MMS, author = "Yi Lei and Shan Yang and Xinsheng Wang and Lei Xie", title = "{MsEmoTTS}: Multi-Scale Emotion Transfer, Prediction, and Control for Emotional Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "853--864", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145293", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2022:NND, author = "Tao Wang and Ruibo Fu and Jiangyan Yi and Jianhua Tao and Zhengqi Wen", title = "{NeuralDPS}: Neural Deterministic Plus Stochastic Model 
With Multiband Excitation for Noise-Controllable Waveform Generation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "865--878", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3140480", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Stone:2022:ASV, author = "Simon Stone and Yingming Gao and Peter Birkholz", title = "Articulatory Synthesis of Vocalized {\tt /r/} Allophones in {German}", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "879--889", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3130969", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Serai:2022:HSR, author = "Prashant Serai and Vishal Sunder and Eric Fosler-Lussier", title = "Hallucination of Speech Recognition Errors With Sequence to Sequence Learning", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "890--900", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145313", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2022:MUE, author = "Bin Wu and Sakriani Sakti and Jinsong Zhang and Satoshi Nakamura", title = "Modeling Unsupervised Empirical Adaptation by {DPGMM} and {DPGMM-RNN} Hybrid Model to Extract Perceptual Features for Low-Resource {ASR}", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "901--916", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3150220", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2022:EFR, author = "Mi Zhang and Tieyun Qian and Bing Liu", title = "Exploit Feature and Relation Hierarchy for Relation Extraction", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "917--930", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153256", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jiao:2022:EIE, author = "Wenxiang Jiao and Xing Wang and Shilin He and Zhaopeng Tu and Irwin King and Michael R. 
Lyu", title = "Exploiting Inactive Examples for Natural Language Generation With Data Rejuvenation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "931--943", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153269", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tu:2022:AFL, author = "Youzhi Tu and Man-Wai Mak", title = "Aggregating Frame-Level Information in the Spectral Domain With Self-Attention for Speaker Embedding", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "944--957", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153267", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tan:2022:DMB, author = "Zhixing Tan and Zeyuan Yang and Meng Zhang and Qun Liu and Maosong Sun and Yang Liu", title = "Dynamic Multi-Branch Layers for On-Device Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "958--967", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153257", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = 
"https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2022:MRL, author = "Weiwei Lin and Man-Wai Mak", title = "Mixture Representation Learning for Deep Speaker Embedding", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "968--978", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153270", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhu:2022:ICN, author = "Peng Zhu and Dawei Cheng and Fangzhou Yang and Yifeng Luo and Dingjiang Huang and Weining Qian and Aoying Zhou", title = "Improving {Chinese} Named Entity Recognition by Large-Scale Syntactic Dependency Graph", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "979--991", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153261", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liang:2022:MTD, author = "Xiaobo Liang and Lijun Wu and Juntao Li and Tao Qin and Min Zhang and Tie-Yan Liu", title = "Multi-Teacher Distillation With Single Model for Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "992--1002", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153264", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", 
bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2022:TAF, author = "Xiaofeng Chen and Guohua Wang and Haopeng Ren and Yi Cai and Ho-fung Leung and Tao Wang", title = "Task-Adaptive Feature Fusion for Generalized Few-Shot Relation Classification in an Open World Environment", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1003--1015", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153254", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2022:SNC, author = "Yu-Chen Lin and Cheng Yu and Yi-Te Hsu and Szu-Wei Fu and Yu Tsao and Tei-Wei Kuo", title = "{SEOFP-NET}: Compression and Acceleration of Deep Neural Networks for Speech Enhancement Using Sign-Exponent-Only Floating-Points", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1016--1031", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3133209", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/fparith.bib; https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nakatani:2022:SIV, author = "Tomohiro Nakatani and Rintaro Ikeshita 
and Keisuke Kinoshita and Hiroshi Sawada and Naoyuki Kamo and Shoko Araki", title = "Switching Independent Vector Analysis and its Extension to Blind and Spatially Guided Convolutional Beamforming Algorithms", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1032--1047", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3155271", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Geng:2022:MLT, author = "Jianhua Geng and Sifan Wang and Qinglai Liu and Xin Lou", title = "Multi-Level Time-Frequency Bins Selection for Direction of Arrival Estimation Using a Single Acoustic Vector Sensor", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1048--1060", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3155276", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2022:AMW, author = "Qinzhuo Wu and Qi Zhang and Xuanjing Huang", title = "Automatic Math Word Problem Generation With Topic-Expression Co-Attention Mechanism and Reinforcement Learning", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1061--1072", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3155284", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nigro:2022:MSA, author = "Michael Nigro and Sridhar Krishnan", title = "Multimodal System for Audio Scene Source Counting and Analysis", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1073--1082", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3156795", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Peng:2022:CSM, author = "Yishu Peng and Sheng Zhang and Jiashu Zhang and Wei Xing Zheng", title = "Combined-Sample Multiband-Structured Subband Filtering Algorithms", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1083--1092", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3156791", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hu:2022:NAS, author = "Shoukang Hu and Xurong Xie and Mingyu Cui and Jiajun Deng and Shansong Liu and Jianwei Yu and Mengzhe Geng and Xunying Liu and Helen Meng", title = "Neural Architecture Search for {LF-MMI} Trained Time Delay Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", 
pages = "1093--1107", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153253", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Dang:2022:TBR, author = "Xudong Dang and Wen Ma and Emanu{\"e}l A. P. Habets and Hongyan Zhu", title = "{TDOA}-Based Robust Sound Source Localization With Sparse Regularization in Wireless Acoustic Sensor Networks", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1108--1123", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153251", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gao:2022:SDM, author = "Shan Gao and Jing Lin and Xihong Wu and Tianshu Qu", title = "Sparse {DNN} Model for Frequency Expanding of Higher Order Ambisonics Encoding Process", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1124--1135", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153266", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pepe:2022:DOP, author = 
"Giovanni Pepe and Leonardo Gabrielli and Stefano Squartini and Carlo Tripodi and Nicol{\`o} Strozzi", title = "Deep Optimization of Parametric {IIR} Filters for Audio Equalization", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1136--1149", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3155289", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lee:2022:NAF, author = "Moa Lee and Junmo Lee and Joon-Hyuk Chang", title = "Non-Autoregressive Fully Parallel Deep Convolutional Neural Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1150--1159", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3156797", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Barrett:2022:SRM, author = "Liam Barrett and Junchao Hu and Peter Howell", title = "Systematic Review of Machine Learning Approaches for Detecting Developmental Stuttering", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1160--1172", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3155295", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, 
Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lee:2022:DCV, author = "Sang-Hoon Lee and Hyeong-Rae Noh and Woo-Jeoung Nam and Seong-Whan Lee", title = "Duration Controllable Voice Conversion via Phoneme-Based Information Bottleneck", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1173--1183", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3156757", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shao:2022:AGN, author = "Zhihong Shao and Zhongqin Wu and Minlie Huang", title = "{AdvExpander}: Generating Natural Language Adversarial Examples by Expanding Text", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1184--1196", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2021.3129339", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Devalraju:2022:MES, author = "Dhanunjaya Varma Devalraju and Padmanabhan Rajan", title = "Multiview Embeddings for Soundscape Classification", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1197--1206", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153272", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = 
"https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2022:AAR, author = "Chengyu Wang and Suyang Dai and Yipeng Wang and Fei Yang and Minghui Qiu and Kehan Chen and Wei Zhou and Jun Huang", title = "{ARoBERT}: an {ASR} Robust Pre-Trained Language Model for Spoken Language Understanding", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1207--1218", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153268", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ong:2022:AVB, author = "Jonah Ong and Ba Tuong Vo and Sven Nordholm and Ba-Ngu Vo and Diluka Moratuwage and Changbeom Shim", title = "Audio-Visual Based Online Multi-Source Separation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1219--1234", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3156758", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cui:2022:LAN, author = "Leyang Cui and Yafu Li and Yue Zhang", title = "Label Attention Network for Structured Prediction", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages 
= "1235--1248", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3145311", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sutojo:2022:SMM, author = "Sarinah Sutojo and Tobias May and Steven van de Par", title = "Segmentation of Multitalker Mixtures Based on Local Feature Contrasts and Auditory Glimpses", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1249--1262", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3155285", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gao:2022:WLP, author = "Hao Gao and Xuelei Feng and Yong Shen", title = "Weighted Loudspeaker Placement Method for Sound Field Reproduction", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1263--1276", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3158187", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Huang:2022:KPM, author = "Gongping Huang and Jacob Benesty and Israel Cohen and Jingdong Chen", 
title = "{Kronecker} Product Multichannel Linear Filtering for Adaptive Weighted Prediction Error-Based Speech Dereverberation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1277--1289", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3161150", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sugimoto:2022:LLC, author = "Takehiro Sugimoto", title = "Loudness-Level-Chasing Algorithm for Multiformat Live Audio Production", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1290--1304", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3153262", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2022:DHT, author = "Junshuang Wu and Richong Zhang and Yongyi Mao and Jinpeng Huai", title = "Dealing With Hierarchical Types and Label Noise in Fine-Grained Entity Typing", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1305--1318", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3155281", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ragni:2022:ICE, author = "Anton Ragni and Mark J. F. Gales and Oliver Rose and Katherine M. Knill and Alexandros Kastanos and Qiujia Li and Preben M. Ness", title = "Increasing Context for Estimating Confidence Scores in Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1319--1329", year = "2022", CODEN = "????", DOI = "https://doi.org/10.1109/TASLP.2022.3161153", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Thu Apr 7 10:27:19 2022", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bai:2022:EES, author = "Zhongxin Bai and Jianyu Wang and Xiao-Lei Zhang and Jingdong Chen", title = "End-to-End Speaker Verification via Curriculum Bipartite Ranking Weighted Binary Cross-Entropy", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1330--1344", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3161155", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3161155", abstract = "End-to-end speaker verification achieves the verification through estimating directly the similarity score between a pair of utterances, which is formulated as a binary (i.e., target versus non-target) classification problem. 
Unlike the stage-wise method, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chuang:2022:ILA, author = "Shang-Yi Chuang and Hsin-Min Wang and Yu Tsao", title = "Improved {Lite} Audio-Visual Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1345--1359", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3153265", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3153265", abstract = "Numerous studies have investigated the effectiveness of audio-visual multimodal learning for speech enhancement (AVSE) tasks, seeking a solution that uses visual data as auxiliary and complementary input to reduce the noise of noisy speech signals. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cheng:2022:EUA, author = "Gaofeng Cheng and Haoran Miao and Runyan Yang and Keqi Deng and Yonghong Yan", title = "{ETEH}: Unified Attention-Based End-to-End {ASR} and {KWS} Architecture", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1360--1373", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3161159", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3161159", abstract = "Even though attention-based end-to-end (E2E) automatic speech recognition (ASR) models have been yielding state-of-the-art recognition accuracy, they still fall behind many of the ASR models deployed in the industry in some crucial functionalities such as \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pandey:2022:SAR, author = "Ashutosh Pandey and DeLiang Wang", title = "Self-Attending {RNN} for Speech Enhancement to Improve Cross-Corpus Generalization", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1374--1385", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3161143", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3161143", abstract = "Deep neural networks (DNNs) represent the mainstream methodology for supervised speech enhancement, primarily due to their capability to model complex functions 
using hierarchical representations. However, a recent study revealed that DNNs trained on a \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jin:2022:TTD, author = "Di Jin and Shuyang Gao and Seokhwan Kim and Yang Liu and Dilek Hakkani-T{\"u}r", title = "Towards Textual Out-of-Domain Detection Without In-Domain Labels", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1386--1395", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3162081", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3162081", abstract = "In many real-world settings, machine learning models need to identify user inputs that are out-of-domain (OOD) so as to avoid performing wrong actions. This work focuses on a challenging case of OOD detection, where no labels for in-domain data are \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mrinalini:2022:SSB, author = "K. Mrinalini and P. Vijayalakshmi and T. 
Nagarajan", title = "{SBSim}: a {Sentence-BERT} Similarity-Based Evaluation Metric for {Indian} Language Neural Machine Translation Systems", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1396--1406", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3161160", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3161160", abstract = "Machine translation (MT) outputs are widely scored using automatic evaluation metrics and human evaluation scores. The automatic evaluation metrics are expected to be easily computable and a reflection of human evaluation. Traditional string-based metrics \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2022:AST, author = "Changhong Wang and Emmanouil Benetos and Vincent Lostanlen and Elaine Chew", title = "Adaptive Scattering Transforms for Playing Technique Recognition", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1407--1421", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3156785", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3156785", abstract = "Playing techniques contain distinctive information about musical expressivity and interpretation. 
Yet, current research in music signal analysis suffers from a scarcity of computational models for playing techniques, especially in the context of live \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cai:2022:IVI, author = "Danwei Cai and Weiqing Wang and Ming Li", title = "Incorporating Visual Information in Audio Based Self-Supervised Speaker Recognition", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1422--1435", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3162078", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3162078", abstract = "The current success of deep learning largely benefits from the availability of large amount of labeled data. However, collecting a large-scale dataset with human annotation can be expensive and sometimes difficult. 
Self-supervised learning thus attracts \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Luo:2022:EAE, author = "Yu Luo and Lina Pu", title = "{EC-ANC}: Edge Case-Enhanced Active Noise Cancellation for True Wireless Stereo Earbuds", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1436--1447", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3164211", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3164211", abstract = "In this paper, we propose an edge case-enhanced active noise cancellation (EC-ANC) system that integrates a piezo microphone, a signal processor, and a wireless module into the charging case of TWS earbuds. 
Considering the fact that sound travels much \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2022:CSE, author = "Tao Li and Xinsheng Wang and Qicong Xie and Zhichao Wang and Lei Xie", title = "Cross-Speaker Emotion Disentangling and Transfer for End-to-End Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1448--1460", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3164181", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3164181", abstract = "The cross-speaker emotion transfer task in text-to-speech (TTS) synthesis particularly aims to synthesize speech for a target speaker with the emotion transferred from reference speech recorded by another (source) speaker. 
During the emotion transfer \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2022:RKN, author = "Yilin Zhao and Zhuosheng Zhang and Hai Zhao", title = "Reference Knowledgeable Network for Machine Reading Comprehension", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1461--1473", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3164219", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3164219", abstract = "Multi-choice Machine Reading Comprehension (MRC) as a challenge requires models to select the most appropriate answer from a set of candidates with a given passage and question. Most of the existing researches focus on the modeling of specific tasks or \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yu:2022:NAA, author = "Fu-Hao Yu and Kuan-Yu Chen and Ke-Han Lu", title = "Non-Autoregressive {ASR} Modeling Using Pre-Trained Language Models for {Chinese} Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1474--1482", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3166400", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3166400", abstract = "Transformer-based models have led to significant innovation in various classic and practical subjects, including speech processing, natural language 
processing, and computer vision. On top of the Transformer, attention-based end-to-end automatic speech \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cui:2022:TMR, author = "Yiming Cui and Ting Liu and Wanxiang Che and Zhigang Chen and Shijin Wang", title = "Teaching Machines to Read, Answer and Explain", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1483--1492", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3156789", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3156789", abstract = "With various Pre-trained Language Models (PLMs) blooming, Machine Reading Comprehension (MRC) systems have embraced significant improvements on various benchmarks and even surpassed human performances. 
However, most existing works only focus on the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Horiguchi:2022:EDB, author = "Shota Horiguchi and Yusuke Fujita and Shinji Watanabe and Yawen Xue and Paola Garc{\'\i}a", title = "Encoder-Decoder Based Attractors for End-to-End Neural Diarization", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1493--1507", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3162080", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3162080", abstract = "This paper investigates an end-to-end neural diarization (EEND) method for an unknown number of speakers. In contrast to the conventional cascaded approach to speaker diarization, EEND methods are better in terms of speaker overlap handling. 
However, EEND \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2022:DPM, author = "Chenda Li and Zhuo Chen and Yanmin Qian", title = "Dual-Path Modeling With Memory Embedding Model for Continuous Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1508--1520", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3165712", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3165712", abstract = "Continuous speech separation (CSS) aims at separating overlap-free targets from a long, partially-overlapped recording. Though it has shown promising results, the origin CSS framework does not consider cross-window information and long-span dependency. To \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tong:2022:SIU, author = "Yu Tong and Jingzhi Guo and Jizhe Zhou", title = "Separation Inference: a Unified Framework for Word Segmentation in {East} {Asian} Languages", journal = j-IEEE-ACM-TASLP, volume = "30", number = "??", pages = "1521--1530", year = "2022", DOI = "https://doi.org/10.1109/TASLP.2022.3161142", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:28:53 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3161142", abstract = "Existing methods consider Word Segmentation (WS) as sequence tagging. Each tag indicates the position of the current character in a segment. 
The exactness of the position for any non-boundaries character is unnecessary. Any incorrect inner prediction \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bhattacharjee:2023:CVO, author = "Mrinmoy Bhattacharjee and S. R. M. Prasanna and Prithwijit Guha", title = "Clean vs. Overlapped Speech-Music Detection Using Harmonic-Percussive Features and Multi-Task Learning", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1--10", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3164199", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3164199", abstract = "Detection of speech and music signals in isolated and overlapped conditions is an essential preprocessing step for many audio applications. 
Speech signals have \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Luo:2023:DSI, author = "Zhaojie Luo and Shoufeng Lin and Rui Liu and Jun Baba and Yuichiro Yoshikawa and Hiroshi Ishiguro", title = "Decoupling Speaker-Independent Emotions for Voice Conversion via Source-Filter Networks", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "11--24", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3190715", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3190715", abstract = "Emotional voice conversion (VC) aims to convert a neutral voice to an emotional one while retaining the linguistic information and speaker identity. We note that \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tian:2023:ILF, author = "Jinchuan Tian and Jianwei Yu and Chao Weng and Yuexian Zou and Dong Yu", title = "Integrating Lattice-Free {MMI} Into End-to-End Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "25--38", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3198555", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3198555", abstract = "In automatic speech recognition (ASR) research, discriminative criteria have achieved superior performance in DNN-HMM systems.
Given this success, the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Shankar:2023:DFB,
  author = "Ravi Shankar and Hsi-Wei Hsieh and Nicolas Charon and Archana Venkataraman",
  title = "A Diffeomorphic Flow-Based Variational Framework for Multi-Speaker Emotion Conversion",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "39--53",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3209948",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3209948",
  abstract = "This paper introduces a new framework for non-parallel emotion conversion in speech. Our framework is based on two key contributions. First, we propose a \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zezario:2023:DLB,
  author = "Ryandhimas E.
Zezario and Szu-Wei Fu and Fei Chen and Chiou-Shann Fuh and Hsin-Min Wang and Yu Tsao",
  title = "Deep Learning-Based Non-Intrusive Multi-Objective Speech Assessment Model With Cross-Domain Features",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "54--70",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3205757",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3205757",
  abstract = "This study proposes a cross-domain multi-objective speech assessment model, called MOSA-Net, which can simultaneously estimate the speech quality, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Qin:2023:RMC,
  author = "Xiaoyi Qin and Danwei Cai and Ming Li",
  title = "Robust Multi-Channel Far-Field Speaker Verification Under Different In-Domain Data Availability Scenarios",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "71--85",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3212834",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3212834",
  abstract = "The popularity and application of smart home devices have made far-field speaker verification an urgent need. However, speaker verification performance is \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Mathad:2023:CVT,
  author = "Vikram C. Mathad and Julie M.
Liss and Kathy Chapman and Nancy Scherer and Visar Berisha",
  title = "Consonant-Vowel Transition Models Based on Deep Learning for Objective Evaluation of Articulation",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "86--95",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3209937",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3209937",
  abstract = "Spectro-temporal dynamics of consonant-vowel (CV) transition regions are considered to provide robust cues related to articulation. In this work, we propose an \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Li:2023:FIA,
  author = "Li Li and Hirokazu Kameoka and Shoji Makino",
  title = "{FastMVAE2}: On Improving and Accelerating the Fast Variational Autoencoder-Based Source Separation Algorithm for Determined Mixtures",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "96--110",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3214763",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3214763",
  abstract = "This article proposes a new source model and training scheme to improve the accuracy and speed of the multichannel variational autoencoder (MVAE) method.
The \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2023:MSG,
  author = "Jie Wang and Yan Yang and Keyu Liu and Zhiping Zhu and Xiaorong Liu",
  title = "{M3S}: Scene Graph Driven Multi-Granularity Multi-Task Learning for Multi-Modal {NER}",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "111--120",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3221017",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221017",
  abstract = "Multi-modal Named Entity Recognition (MNER), which mainly focuses on enhancing text-only NER with visual information, has recently attracted considerable \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Delcroix:2023:STS,
  author = "Marc Delcroix and Jorge Bennasar Vazquez and Tsubasa Ochiai and Keisuke Kinoshita and Yasunori Ohishi and Shoko Araki",
  title = "{SoundBeam}: Target Sound Extraction Conditioned on Sound-Class Labels and Enrollment Clues for Increased Performance and Continuous Learning",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "121--136",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3221000",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221000",
  abstract = "In many situations, we would like to hear desired sound events (SEs) while being able to ignore
interference. Target sound extraction (TSE) tackles this \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Niizumi:2023:BAE,
  author = "Daisuke Niizumi and Daiki Takeuchi and Yasunori Ohishi and Noboru Harada and Kunio Kashino",
  title = "{BYOL} for Audio: Exploring Pre-Trained General-Purpose Audio Representations",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "137--151",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3221007",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221007",
  abstract = "Pre-trained models are essential as feature extractors in modern machine learning systems in various domains. In this study, we hypothesize that representations \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Xu:2023:MWR,
  author = "Yingrui Xu and Hao Liu and Jingguo Ge and Xiaodan Zhang and Jingyuan Hu and Yulei Wu and Honglei Lv and Hongbin Shi and Wei Zhou",
  title = "Mining Weak Relations Between Reviews for Opinion Spam Detection",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "152--162",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3221008",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221008",
  abstract = "Online reviews play a significant role in purchase decisions of consumers by providing feedback
information from buyers of products. In order to mislead \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Masuyama:2023:OPR,
  author = "Yoshiki Masuyama and Kohei Yatabe and Kento Nagatomo and Yasuhiro Oikawa",
  title = "Online Phase Reconstruction via {DNN-Based} Phase Differences Estimation",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "163--176",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3221041",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221041",
  abstract = "This paper presents a two-stage online phase reconstruction framework using causal deep neural networks (DNNs). Phase reconstruction is a task of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Liu:2023:TGT,
  author = "Jiang Liu and Donghong Ji and Jingye Li and Dongdong Xie and Chong Teng and Liang Zhao and Fei Li",
  title = "{TOE}: a Grid-Tagging Discontinuous {NER} Model Enhanced by Embedding {Tag\slash} Word Relations and More Fine-Grained Tags",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "177--187",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3221009",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221009",
  abstract = "So far, discontinuous named entity recognition (NER) has received increasing research attention and many
related methods have surged such as \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Hu:2023:CDG,
  author = "Zhe Hu and Zhiwei Cao and Hou Pong Chan and Jiachen Liu and Xinyan Xiao and Jinsong Su and Hua Wu",
  title = "Controllable Dialogue Generation With Disentangled Multi-Grained Style Specification and Attribute Consistency Reward",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "188--199",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3221002",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221002",
  abstract = "Controllable text generation is an appealing but challenging task, which allows users to specify particular attributes of the generated outputs.
In this paper, we propose \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Abderrazek:2023:IDR,
  author = "Sondes Abderrazek and Corinne Fredouille and Alain Ghio and Muriel Lalain and Christine Meunier and Virginie Woisard",
  title = "Interpreting Deep Representations of Phonetic Features via Neuro-Based Concept Detector: Application to Speech Disorders Due to Head and Neck Cancer",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "200--214",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3221039",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221039",
  abstract = "The popularity of Deep Neural Networks (DNNs) is growing significantly, and so is the interest in gaining a better understanding of their functioning.
In this work, it is \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhang:2023:EES,
  author = "Jie Zhang and Rui Tao and Jun Du and Li-Rong Dai",
  title = "Energy-Efficient Sparsity-Driven Speech Enhancement in Wireless Acoustic Sensor Networks",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "215--228",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3221013",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221013",
  abstract = "Wireless acoustic sensor network (WASN) has shown a superiority over conventional microphone arrays in many aspects. There exists an important tradeoff \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2023:MVB,
  author = "Xianke Wang and Bowen Tian and Weiming Yang and Wei Xu and Wenqing Cheng",
  title = "{MusicYOLO}: a Vision-Based Framework for Automatic Singing Transcription",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "229--241",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3221005",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221005",
  abstract = "Automatic singing transcription (AST), which refers to the process of inferring the onset, offset, and pitch from the singing audio, is of great significance in music \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Liu:2023:AAP,
  author = "Yuanyuan Liu and Mittapalle Kiran Reddy and Nelly Penttila and Tiina Ihalainen and Paavo Alku and Okko Rasanen",
  title = "Automatic Assessment of {Parkinson's} Disease Using Speech Representations of Phonation and Articulation",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "242--255",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3212829",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3212829",
  abstract = "Speech from people with Parkinson's disease (PD) are likely to be degraded on phonation, articulation, and prosody. Motivated to describe \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Sudholt:2023:PDN,
  author = "David Sudholt and Alec Wright and Cumhur Erkut and Vesa Valimaki",
  title = "Pruning Deep Neural Network Models of Guitar Distortion Effects",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "256--264",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3223257",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3223257",
  abstract = "Deep neural networks have been successfully used in the task of black-box modeling of analog audio effects such as distortion.
Improving the processing speed \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Jiao:2023:EMD,
  author = "Fangkai Jiao and Yangyang Guo and Minlie Huang and Liqiang Nie",
  title = "Enhanced Multi-Domain Dialogue State Tracker With Second-Order Slot Interactions",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "265--276",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3221044",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221044",
  abstract = "Dialogue state tracking (DST) is often used to track the system's understanding of the user goal in task-oriented dialogue systems. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Tian:2023:SSS,
  author = "Hui Tian and Yiqin Qiu and Wojciech Mazurczyk and Haizhou Li and Zhenxing Qian",
  title = "{STFF-SM}: Steganalysis Model Based on Spatial and Temporal Feature Fusion for Speech Streams",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "277--289",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3224295",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3224295",
  abstract = "The real-time detection of speech steganography in Voice-over-Internet-Protocol (VoIP) scenarios remains an open problem, as it requires \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Singh:2023:ETM,
  author = "Gopendra Vikram Singh and Mauajama Firdaus and Asif Ekbal and Pushpak Bhattacharyya",
  title = "{EmoInt-Trans}: a Multimodal Transformer for Identifying Emotions and Intents in Social Conversations",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "290--300",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3224287",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3224287",
  abstract = "In the natural language processing community, open-domain conversational agents, also known as chatbots, are gaining popularity. One of the difficulties \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Hu:2023:DSR,
  author = "De De Hu and Huaiwen Zhang and Feilong Bao and Rui Wang",
  title = "Distributed Sampling Rate Offset Estimation Over Acoustic Sensor Networks Based on Asynchronous Network {Newton} Optimization",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "301--312",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3224256",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3224256",
  abstract = "Sampling rate synchronization is an inevitable issue in distributed acoustic sensor networks.
In this paper, an analytical sampling rate offset (SRO) \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Diaz-Guerra:2023:DAE,
  author = "David Diaz-Guerra and Antonio Miguel and Jose R. Beltran",
  title = "Direction of Arrival Estimation of Sound Sources Using Icosahedral {CNNs}",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "313--321",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3224282",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3224282",
  abstract = "In this paper, we present a new model for Direction of Arrival (DOA) estimation of sound sources based on an Icosahedral Convolutional Neural Network \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Guo:2023:CSF,
  author = "Peiming Guo and Shen Huang and Peijie Jiang and Yueheng Sun and Meishan Zhang and Min Zhang",
  title = "Curriculum-Style Fine-Grained Adaption for Unsupervised Cross-Lingual Dependency Transfer",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "322--332",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3224302",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3224302",
  abstract = "Unsupervised cross-lingual transfer has been shown great potentials for dependency parsing of the low-resource languages when there is no annotated treebank
\ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Desiraju:2023:JOE,
  author = "Naveen Kumar Desiraju and Simon Doclo and Markus Buck and Tobias Wolff",
  title = "Joint Online Estimation of Early and Late Residual Echo {PSD} for Residual Echo Suppression",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "333--344",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3224292",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3224292",
  abstract = "In hands-free telephony and other distant-talking applications, an acoustic echo cancellation system is typically required, where a short adaptive filter is \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Sun:2023:MBW,
  author = "Guangzhi Sun and Chao Zhang and Philip C. Woodland",
  title = "Minimising Biasing Word Errors for Contextual {ASR} With the Tree-Constrained Pointer Generator",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "345--354",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3224286",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3224286",
  abstract = "Contextual knowledge is essential for reducing speech recognition errors on high-valued long-tail words.
This paper proposes a novel tree-constrained pointer \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Casebeer:2023:MAM,
  author = "Jonah Casebeer and Nicholas J. Bryan and Paris Smaragdis",
  title = "{Meta-AF}: Meta-Learning for Adaptive Filters",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "355--370",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3224288",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3224288",
  abstract = "Adaptive filtering algorithms are pervasive throughout signal processing and have had a material impact on a wide variety of domains including audio \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Fu:2023:CLN,
  author = "Yingwen Fu and Nankai Lin and Boyu Chen and Ziyu Yang and Shengyi Jiang",
  title = "Cross-Lingual Named Entity Recognition for Heterogeneous Languages",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "371--382",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3212698",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3212698",
  abstract = "Previous works on cross-lingual Named Entity Recognition (NER) have achieved great success.
However, few of them consider the effect of language \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2023:TST,
  author = "Jun-You Wang and Jyh-Shing Roger Jang",
  title = "Training a Singing Transcription Model Using Connectionist Temporal Classification Loss and Cross-Entropy Loss",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "383--396",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3224297",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3224297",
  abstract = "In this paper, we propose a method that uses a combination of the Connectionist Temporal Classification (CTC) loss and the cross-entropy loss to train a note-level singing transcription model.
By considering the task as predicting a note sequence of the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2023:SDN,
  author = "Zhong-Qiu Wang and Gordon Wichern and Shinji Watanabe and Jonathan Le Roux",
  title = "{STFT-Domain} Neural Speech Enhancement With Very Low Algorithmic Latency",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "397--410",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3224285",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3224285",
  abstract = "Deep learning based speech enhancement in the short-time Fourier transform (STFT) domain typically uses a large window length such as 32 ms. A larger window can lead to higher frequency resolution and potentially better enhancement.
This however incurs an \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Li:2023:NRR,
  author = "Yu Li and Bojie Hu and Jian Liu and Yufeng Chen and Jinan Xu",
  title = "A Neighborhood Re-Ranking Model With Relation Constraint for Knowledge Graph Completion",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "411--425",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3225537",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3225537",
  abstract = "Knowledge graph completion (KGC) aims to predict missing links based on observed triples. However, current KGC models are still limited by the following two aspects. (1) the entity semantics is implicitly learned by neural network and merely depends on \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Miaschi:2023:RSN,
  author = "Alessio Miaschi and Dominique Brunato and Felice Dell'Orletta and Giulia Venturi",
  title = "On Robustness and Sensitivity of a Neural Language Model: a Case Study on {Italian} {L1} Learner Errors",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "426--438",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3226333",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3226333",
  abstract = "In this paper, we propose a comprehensive linguistic study aimed at assessing the
implicit behavior of one of the most prominent Neural Language Models (NLM) based on Transformer architectures, BERT Devlin et al., when dealing with a particular source of \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Xiao:2023:TEP,
  author = "Rong Xiao and Yu Wan and Baosong Yang and Haibo Zhang and Huajin Tang and Derek F. Wong and Boxing Chen",
  title = "Towards Energy-Preserving Natural Language Understanding With Spiking Neural Networks",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "439--447",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3221011",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221011",
  abstract = "Artificial neural networks have shown promising results in a variety of natural language understanding (NLU) tasks.
Despite their successes, conventional neural-based NLU models are criticized for high energy consumption, making them laborious to be \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhao:2023:SSB,
  author = "Juan Zhao and Tianrui Zong and Yong Xiang and Longxiang Gao and Guang Hua and Keshav Sood and Yushu Zhang",
  title = "{SSVS-SSVD} Based Desynchronization Attacks Resilient Watermarking Method for Stereo Signals",
  journal = j-IEEE-ACM-TASLP,
  volume = "31",
  number = "??",
  pages = "448--461",
  year = "2023",
  DOI = "https://doi.org/10.1109/TASLP.2022.3225668",
  ISSN = "2329-9290",
  ISSN-L = "2329-9290",
  bibdate = "Wed May 17 14:29:03 MDT 2023",
  bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3225668",
  abstract = "Most of the audio signals in real-world applications are stereo signals.
However, the previous desynchronization attacks resilient watermarking methods cannot preserve perceptual quality or achieve robustness when constrained by high embedding rates and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:TFA, author = "Qiquan Zhang and Xinyuan Qian and Zhaoheng Ni and Aaron Nicolson and Eliathamby Ambikairajah and Haizhou Li", title = "A Time-Frequency Attention Module for Neural Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "462--475", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3225649", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3225649", abstract = "Speech enhancement plays an essential role in a wide range of speech processing applications. Recent studies on speech enhancement tend to investigate how to effectively capture the long-term contextual dependencies of speech signals to boost performance. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xie:2023:CAF, author = "Binhong Xie and Yu Li and Hongyan Zhao and Lihu Pan and Enhui Wang", title = "A Cross-Attention Fusion Based Graph Convolution Auto-Encoder for Open Relation Extraction", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "476--485", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3226680", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3226680", abstract = "Open Relation Extraction (OpenRE) aims at clustering relation instances to extract relation types. By learning relation patterns between named entities, it clusters semantically equivalent patterns into a unified relation cluster. Existing clustering-. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hong:2023:GAI, author = "Qian-Bei Hong and Chung-Hsien Wu and Hsin-Min Wang", title = "Generalization Ability Improvement of Speaker Representation and Anti-Interference for Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "486--499", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3221042", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221042", abstract = "The ability to generalize to mismatches between training and testing conditions and resist interference from other speakers is crucial for the performance of speaker verification. In this paper, we propose two novel approaches to improve the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lyu:2023:RHF, author = "Xinglin Lyu and Junhui Li and Min Zhang and Chenchen Ding and Hideki Tanaka and Masao Utiyama", title = "Refining History for Future-Aware Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "500--512", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3226332", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3226332", abstract = "Neural machine translation uses a decoder to generate target words auto-regressively by predicting the next target word conditioned on a 
given source sentence and its previously predicted target words, i.e., its translation history, which suffers from two \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2023:EEM, author = "Mou Wang and Junqi Chen and Xiao-Lei Zhang and Susanto Rahardja", title = "End-to-End Multi-Modal Speech Recognition on an Air and Bone Conducted Speech Corpus", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "513--524", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3224305", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3224305", abstract = "Automatic speech recognition (ASR) has been significantly improved in the past years. However, most robust ASR systems are based on air-conducted (AC) speech, and their performances in low signal-to-noise-ratio (SNR) conditions are not satisfactory. Bone-. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zorrilla:2023:AEA, author = "Asier L{\'o}pez Zorrilla and Mar{\'\i}a In{\'e}s Torres and Heriberto Cuay{\'a}huitl", title = "Audio Embedding-Aware Dialogue Policy Learning", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "525--538", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3225658", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3225658", abstract = "Following the success of Natural Language Processing (NLP) transformers pretrained via self-supervised learning, similar models have been proposed recently for speech processing such as Wav2Vec2, HuBERT and UniSpeech-SAT. 
An interesting yet unexplored \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shang:2023:MMN, author = "Xichen Shang and Chuxin Chen and Zipeng Chen and Qianli Ma", title = "Modularized Mutuality Network for Emotion-Cause Pair Extraction", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "539--549", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3228129", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3228129", abstract = "Emotion-cause pair extraction (ECPE) is an emerging task born out of Emotion cause extraction (ECE), which aims to extract the emotion clause and the corresponding cause clause simultaneously. Previous methods decompose ECPE into multiple sub-tasks, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qian:2023:AVC, author = "Xinyuan Qian and Zhengdong Wang and Jiadong Wang and Guohui Guan and Haizhou Li", title = "Audio-Visual Cross-Attention Network for Robotic Speaker Tracking", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "550--562", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3226330", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3226330", abstract = "Audio-visual signals can be used jointly for robotic perception as they complement each other. 
Such multi-modal sensory fusion has a clear advantage, especially under noisy acoustic conditions. Speaker localization, as an essential robotic function, was \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tesch:2023:IDN, author = "Kristina Tesch and Timo Gerkmann", title = "Insights Into Deep Non-Linear Filters for Improved Multi-Channel Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "563--575", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3221046", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221046", abstract = "The key advantage of using multiple microphones for speech enhancement is that spatial filtering can be used to complement the tempo-spectral processing. 
In a traditional setting, linear spatial filtering (beamforming) and single-channel post-filtering \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{vonNeumann:2023:SLC, author = "Thilo von Neumann and Keisuke Kinoshita and Christoph Boeddeker and Marc Delcroix and Reinhold Haeb-Umbach", title = "Segment-Less Continuous Speech Separation of Meetings: Training and Evaluation Criteria", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "576--589", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3228629", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3228629", abstract = "Continuous Speech Separation (CSS) has been proposed to address speech overlaps during the analysis of realistic meeting-like conversations by eliminating any overlaps before further processing. 
CSS separates a recording of arbitrarily many speakers into \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Albertini:2023:TSB, author = "Davide Albertini and Alberto Bernardini and Federico Borra and Fabio Antonacci and Augusto Sarti", title = "Two-Stage Beamforming With Arbitrary Planar Arrays of Differential Microphone Array Units", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "590--602", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3231719", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3231719", abstract = "Differential Microphone Arrays (DMAs) are of great interest in the literature on small-sized microphone arrays, due to their good directivity properties and nearly frequency-invariant spatial responses. 
Recently developed beamforming techniques combine \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2023:SSP, author = "Yi-Syuan Chen and Yun-Zhu Song and Hong-Han Shuai", title = "{SPEC}: Summary Preference Decomposition for Low-Resource Abstractive Summarization", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "603--618", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3230539", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3230539", abstract = "Neural abstractive summarization has been widely studied and achieved great success with large-scale corpora. However, the considerable cost of annotating data motivates the need for learning strategies under low-resource settings. 
In this paper, we \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xiao:2023:GHT, author = "Yingying Xiao and Shanmou Chen and Qiangqiang Zhang and Dongyuan Lin and Minglin Shen and Junhui Qian and Shiyuan Wang", title = "Generalized Hyperbolic Tangent Based Random {Fourier} Conjugate Gradient Filter for Nonlinear Active Noise Control", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "619--632", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3230545", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3230545", abstract = "The filtered-x least mean square (FxLMS) algorithm has been proposed for an active noise control (ANC) system. However, due to the used mean square error (MSE) criterion, FxLMS suffers from performance degeneration for non-Gaussian noises, dramatically. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qi:2023:ELR, author = "Jun Qi and Chao-Han Huck Yang and Pin-Yu Chen and Javier Tejedor", title = "Exploiting Low-Rank Tensor-Train Deep Neural Networks Based on {Riemannian} Gradient Descent With Illustrations of Speech Processing", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "633--642", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3231714", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3231714", abstract = "This work focuses on designing low-complexity hybrid tensor networks by considering trade-offs between the model complexity and practical performance. Firstly, we exploit a low-rank tensor-train deep neural network (TT-DNN) to build an end-to-end deep \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gu:2023:MSN, author = "Bin Gu and Wu Guo and Jie Zhang", title = "Memory Storable Network Based Feature Aggregation for Speaker Representation Learning", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "643--655", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3231709", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3231709", abstract = "Learning fixed-dimensional speaker representation using deep neural networks is a key step in speaker verification. 
In this work, we propose an auxiliary memory storable network (MSN) to assist a backbone network for learning discriminative features, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Abe:2023:AMM, author = "Takumi Abe and Shoichi Koyama and Natsuki Ueno and Hiroshi Saruwatari", title = "Amplitude Matching for Multizone Sound Field Control", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "656--669", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3231715", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3231715", abstract = "A multizone sound field control method, called amplitude matching, is proposed. The objective of amplitude matching is to synthesize a desired amplitude (or magnitude) distribution over a target region with multiple loudspeakers, whereas the phase \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Barhoush:2023:LDS, author = "Mahdi Barhoush and Ahmed Hallawa and Arne Peine and Lukas Martin and Anke Schmeink", title = "Localization-Driven Speech Enhancement in Noisy Multi-Speaker Hospital Environments Using Deep Learning and Meta Learning", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "670--683", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3231700", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = 
"https://dl.acm.org/doi/10.1109/TASLP.2022.3231700", abstract = "This work addresses the problem of 3D-localizing and enhancing the speech of one main speaker in noisy multi-speaker hospital environments using a multi-channel microphone array. In our model, we propose conducting speaker localization using a machine \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kamper:2023:WSD, author = "Herman Kamper", title = "Word Segmentation on Discovered Phone Units With Dynamic Programming and Self-Supervised Scoring", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "684--694", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3229264", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3229264", abstract = "Recent work on unsupervised speech segmentation has used self-supervised models with phone and word segmentation modules that are trained jointly. 
This paper instead revisits an older approach to word segmentation: bottom-up phone-like unit discovery is \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:JML, author = "Changheng Li and Jorge Martinez and Richard Christian Hendriks", title = "Joint Maximum Likelihood Estimation of Microphone Array Parameters for a Reverberant Single Source Scenario", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "695--705", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3231706", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3231706", abstract = "Estimation of the acoustic-scene related parameters such as relative transfer functions (RTFs) from source to microphones, source power spectral densities (PSDs) and PSDs of the late reverberation is essential and also challenging. 
Existing maximum \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Horiguchi:2023:OND, author = "Shota Horiguchi and Shinji Watanabe and Paola Garc{\'\i}a and Yuki Takashima and Yohei Kawaguchi", title = "Online Neural Diarization of Unlimited Numbers of Speakers Using Global and Local Attractors", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "706--720", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3233237", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3233237", abstract = "A method to perform offline and online speaker diarization for an unlimited number of speakers is described in this paper. End-to-end neural diarization (EEND) has achieved overlap-aware speaker diarization by formulating it as a multi-label \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{He:2023:WNA, author = "Ling He and Jia Fu and Yuanyuan Li and Xi Xiong and Jing Zhang", title = "{WNSA-Net}: an Axial-Attention-Based Network for Schizophrenia Detection Using Wideband and Narrowband Spectrograms", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "721--733", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3209941", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3209941", abstract = "Schizophrenia is a severe mental disease that affects 
patients' thoughts, feelings, and behaviors. Speech signal has proven to be a biomarker in the early diagnosis of schizophrenia. Previous studies on schizophrenic speech detection are mainly \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Prakash:2023:ERL, author = "Anusha Prakash and Hema A. Murthy", title = "Exploring the Role of Language Families for Building Indic Speech Synthesisers", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "734--747", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3230453", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3230453", abstract = "Building end-to-end speech synthesisers for Indian languages is challenging, given the lack of adequate clean training data and multiple grapheme representations across languages. This work explores the importance of training multilingual and multi-. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rohmatillah:2023:HRL, author = "Mahdin Rohmatillah and Jen-Tzung Chien", title = "Hierarchical Reinforcement Learning With Guidance for Multi-Domain Dialogue Policy", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "748--761", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3235202", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3235202", abstract = "Achieving high performance in a multi-domain dialogue system with low computation is undoubtedly challenging. Previous works applying an end-to-end approach have been very successful. However, the computational cost remains a major issue since the large-. \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ghorbani:2023:DEE, author = "Shahram Ghorbani and John H. L. 
Hansen", title = "Domain Expansion for End-to-End Speech Recognition: Applications for {Accent\slash} Dialect Speech", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "762--774", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3233238", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3233238", abstract = "Training Automatic Speech Recognition (ASR) systems with sequentially incoming data from alternate domains is an essential milestone in order to reach human intelligibility level in speech recognition. The main challenge of sequential learning is that \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2023:SHE, author = "Weidong Chen and Xiaofen Xing and Xiangmin Xu and Jianxin Pang and Lan Du", title = "{SpeechFormer++}: a Hierarchical Efficient Framework for Paralinguistic Speech Processing", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "775--788", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3235194", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3235194", abstract = "Paralinguistic speech processing is important in addressing many issues, such as sentiment and neurocognitive disorder analyses. 
Recently, Transformer has achieved remarkable success in the natural language processing field and has demonstrated its \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Holighaus:2023:GBD, author = "Nicki Holighaus and G{\"u}nther Koliander and Clara Hollomey and Friedrich Pillichshammer", title = "Grid-Based Decimation for Wavelet Transforms With Stably Invertible Implementation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "789--801", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3235197", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3235197", abstract = "The constant center frequency to bandwidth ratio (Q-factor) of wavelet transforms provides a very natural representation for audio data. 
However, invertible wavelet transforms have either required non-uniform decimation---leading to irregular data \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2023:RSV, author = "Weiwei Lin and Man-Wai Mak", title = "Robust Speaker Verification Using Deep Weight Space Ensemble", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "802--812", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3233231", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3233231", abstract = "Domain shift is one of the most challenging problems in speaker verification. Although numerous methods have been proposed to address domain shift, most approaches optimize the performance of one domain at the sacrifice of the other. 
As a result, to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:PDC, author = "Lin Zhang and Xin Wang and Erica Cooper and Nicholas Evans and Junichi Yamagishi", title = "The {PartialSpoof} Database and Countermeasures for the Detection of Short Fake Speech Segments Embedded in an Utterance", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "813--825", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3233236", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3233236", abstract = "Automatic speaker verification is susceptible to various manipulations and spoofing, such as text-to-speech synthesis, voice conversion, replay, tampering, adversarial attacks, and so on. 
We consider a new spoofing scenario called ``Partial \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mei:2023:IBP, author = "Jie Mei and Yufan Wang and Xinhui Tu and Ming Dong and Tingting He", title = "Incorporating {BERT} With Probability-Aware Gate for Spoken Language Understanding", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "826--834", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3237156", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3237156", abstract = "Spoken language understanding (SLU) is an essential part of a task-oriented dialogue system, which mainly includes intent detection and slot filling. 
Some existing approaches obtain enhanced semantic representation by establishing the correlation between \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ochiai:2023:MBN, author = "Tsubasa Ochiai and Marc Delcroix and Tomohiro Nakatani and Shoko Araki", title = "Mask-Based Neural Beamforming for Moving Speakers With Self-Attention-Based Tracking", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "835--848", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3237172", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3237172", abstract = "Beamforming is a powerful tool designed to enhance speech signals from the direction of a target source. Computing the beamforming filter requires estimating spatial covariance matrices (SCMs) of the source and noise signals. 
Time-frequency masks are \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gu:2023:TUA, author = "Rongzhi Gu and Shi-Xiong Zhang and Yuexian Zou and Dong Yu", title = "Towards Unified All-Neural Beamforming for Time and Frequency Domain Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "849--862", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3229261", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3229261", abstract = "Recently, frequency domain all-neural beamforming methods have achieved remarkable progress for multichannel speech separation. In parallel, the integration of time domain network structure and beamforming also gains significant attention. 
This study \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Masuda:2023:ISS, author = "Naotake Masuda and Daisuke Saito", title = "Improving Semi-Supervised Differentiable Synthesizer Sound Matching for Practical Applications", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "863--875", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3237161", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3237161", abstract = "While synthesizers have become commonplace in music production, many users find it difficult to control the parameters of a synthesizer to create a sound as they intended. In order to assist the user, the \emph{sound matching} task aims to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Loweimi:2023:MSA, author = "Erfan Loweimi and Zhengjun Yue and Peter Bell and Steve Renals and Zoran Cvetkovic", title = "Multi-Stream Acoustic Modelling Using Raw Real and Imaginary Parts of the {Fourier} Transform", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "876--890", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3237167", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3237167", abstract = "In this paper, we investigate multi-stream acoustic modelling using the raw real and imaginary parts of 
the Fourier transform of speech signals. Using the raw magnitude spectrum, or features derived from it, as a proxy for the real and imaginary parts \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Borgstrom:2023:GAC, author = "Bengt J. Borgstr{\"o}m", title = "A Generative Approach to Condition-Aware Score Calibration for Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "891--901", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3240663", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3240663", abstract = "In speaker verification, score calibration is employed to transform verification scores to log-likelihood ratios (LLRs) which are statistically interpretable. Conventional calibration techniques apply a global score transform. 
However, in condition-aware \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Martin-Morato:2023:SLS, author = "Irene Mart{\'\i}n-Morat{\'o} and Annamaria Mesaros", title = "Strong Labeling of Sound Events Using Crowdsourced Weak Labels and Annotator Competence Estimation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "902--914", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3233468", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3233468", abstract = "Crowdsourcing is a popular tool for collecting large amounts of annotated data, but the specific format of the strong labels necessary for sound event detection is not easily obtainable through crowdsourcing. 
In this work, we propose a novel annotation \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhu:2023:NVT, author = "Wenzhao Zhu and Lei Luo and Jinwei Sun and Mads Gr{\ae}sb{\o}ll Christensen", title = "A New Virtual Tracking Sub-Algorithm Based Hybrid Active Control System for Narrowband Noise With Impulsive Interference", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "915--926", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3240645", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3240645", abstract = "Mechanical noise is usually a mixture of narrowband and impulsive noise which needs complex active noise control (ANC) algorithms to improve the de-noising performance. But the ANC algorithm with a high computation load will reduce the real-time \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Deppisch:2023:DRS, author = "Thomas Deppisch and Sebasti{\`a} V. 
Amengual Gar{\'\i} and Paul Calamia and Jens Ahrens", title = "Direct and Residual Subspace Decomposition of Spatial Room Impulse Responses", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "927--942", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3240657", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3240657", abstract = "Psychoacoustic experiments have shown that directional properties of the direct sound, salient reflections, and the late reverberation of an acoustic room response can have a distinct influence on the auditory perception of a given room. Spatial room \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Moliner:2023:BGB, author = "Eloi Moliner and Vesa V{\"a}lim{\"a}ki", title = "{BEHM-GAN}: Bandwidth Extension of Historical Music Using Generative Adversarial Networks", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "943--956", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3190726", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3190726", abstract = "Audio bandwidth extension aims to expand the spectrum of bandlimited audio signals. 
Although this topic has been broadly studied during recent years, the particular problem of extending the bandwidth of historical music recordings remains an open \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jalmby:2023:LRR, author = "Martin J{\"a}lmby and Filip Elvander and Toon van Waterschoot", title = "Low-Rank Room Impulse Response Estimation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "957--969", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3240650", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3240650", abstract = "In this paper we consider low-rank estimation of room impulse responses (RIRs). Inspired by a physics-driven room-acoustical model, we propose an estimator of RIRs that promotes a low-rank structure for a matricization, or reshaping, of the estimated RIR. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:VLS, author = "Hong Liu and Yucheng Cai and Zhenru Lin and Zhijian Ou and Yi Huang and Junlan Feng", title = "Variational Latent-State {GPT} for Semi-Supervised Task-Oriented Dialog Systems", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "970--984", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3240661", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3240661", abstract = "Recently, two approaches, fine-tuning large pre-trained language models and variational training, have attracted significant interests, separately, for semi-supervised end-to-end task-oriented dialog (TOD) systems. In this paper, we propose Variational \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hu:2023:DSS, author = "De Hu and Qintuya Si and Rui Liu and Feilong Bao", title = "Distributed Sensor Selection for Speech Enhancement With Acoustic Sensor Networks", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "985--999", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3244525", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3244525", abstract = "In distributed acoustic sensor networks, only a few nodes make a significant contribution to speech enhancement tasks. 
Using these most informative nodes instead of the entire network not only avoids unnecessary energy consumption but also prolongs the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhu:2023:BSA, author = "Yingke Zhu and Brian Mak", title = "{Bayesian} Self-Attentive Speaker Embeddings for Text-Independent Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1000--1012", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3244502", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3244502", abstract = "Learning effective and discriminative speaker embeddings is a crucial task in speaker verification. Usually, speaker embeddings are extracted from a speaker-classification DNN that averages the hidden vectors over all the spoken frames of a speaker; the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:CTR, author = "Yuying Li and Yuchen Liu and Donald S. 
Williamson", title = "A Composite {T60} Regression and Classification Approach for Speech Dereverberation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1013--1023", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3245423", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3245423", abstract = "Dereverberation is often performed directly on the reverberant audio signal, without knowledge of the acoustic environment. Reverberation time, {$T_{60}$}, however, is an essential \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:MGD, author = "Hanyi Zhang and Longbiao Wang and Kong Aik Lee and Meng Liu and Jianwu Dang and Helen Meng", title = "Meta-Generalization for Domain-Invariant Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1024--1036", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3244518", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3244518", abstract = "Automatic speaker verification (ASV) exhibits unsatisfactory performance under domain mismatch conditions owing to intrinsic and extrinsic factors, such as variations in speaking styles and recording devices encountered in real-world applications. 
To \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Niu:2023:QSQ, author = "Shu-Tong Niu and Jun Du and Lei Sun and Yu Hu and Chin-Hui Lee", title = "{QDM-SSD}: Quality-Aware Dynamic Masking for Separation-Based Speaker Diarization", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1037--1049", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3244513", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3244513", abstract = "We improve iterative separation-based speaker diarization (ISSD) with quality-aware dynamic masking (QDM). We call the proposed framework QDM-SSD. Compared with ISSD, QDM-SSD enhances the simulated data used for model adaptation through QDM to alleviate \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lyu:2023:HEH, author = "Boyang Lyu and Chunxiao Fan and Yue Ming and Panzi Zhao and Nannan Hu", title = "{En-HACN}: Enhancing Hybrid Architecture With Fast Attention and Capsule Network for End-to-end Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1050--1062", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3245407", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3245407", abstract = "Automatic speech recognition (ASR) is a fundamental technology in the field of artificial intelligence. 
End-to-end (E2E) ASR is favored for its state-of-the-art performance. However, E2E speech recognition still faces speech spatial information loss and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:DFR, author = "Yang Liu and Haoqin Sun and Wenbo Guan and Yuqi Xia and Yongwei Li and Masashi Unoki and Zhen Zhao", title = "A Discriminative Feature Representation Method Based on Cascaded Attention Network With Adversarial Strategy for Speech Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1063--1074", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3245401", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3245401", abstract = "Currently, speech emotion recognition models still could not show satisfactory performance due to the complexity of emotions. In most of the previous studies, there is a common problem that some of the particular emotions are severely misclassified. 
In \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:IST, author = "Hao Zhang and Nianwen Si and Yaqi Chen and Wenlin Zhang and Xukui Yang and Dan Qu and Wei-Qiang Zhang", title = "Improving Speech Translation by Cross-Modal Multi-Grained Contrastive Learning", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1075--1086", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3244521", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3244521", abstract = "The end-to-end speech translation (E2E-ST) model has gradually become a mainstream paradigm due to its low latency and less error propagation. However, it is non-trivial to train such a model well due to the task complexity and data scarcity. The speech-\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2023:SML, author = "Wei-Cheng Lin and Carlos Busso", title = "Sequential Modeling by Leveraging Non-Uniform Distribution of Speech Emotion", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1087--1099", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3244527", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3244527", abstract = "The expression and perception of human emotions are not uniformly distributed over time. 
Therefore, tracking local changes of emotion within a segment can lead to better models for \emph{speech emotion recognition} (SER), even when the task is \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tripathi:2023:DDN, author = "Achyut Mani Tripathi and Om Jee Pandey", title = "Divide and Distill: New Outlooks on Knowledge Distillation for Environmental Sound Classification", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1100--1113", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3244507", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3244507", abstract = "Environmental sound classification (ESC) is an important research problem with a broad range of applications including audio-based surveillance, audio-visual systems, smart homes, and robotics, among others. 
The recently proposed vision multi-layer \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:LLA, author = "Hao Zhang and Ashutosh Pandey and DeLiang Wang", title = "Low-Latency Active Noise Control Using Attentive Recurrent Network", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1114--1123", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3244528", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3244528", abstract = "Processing latency is a critical issue for active noise control (ANC) due to the causality constraint of ANC systems. This paper addresses low-latency ANC in the context of deep learning (i.e. deep ANC). A time-domain method using an attentive recurrent \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bross:2023:TBM, author = "Avital Bross and Sharon Gannot", title = "Training-Based Multiple Source Tracking Using Manifold-Learning and Recursive Expectation-Maximization", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1124--1140", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3245414", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3245414", abstract = "In this paper we propose a data-driven approach for multiple speaker tracking in reverberant enclosures. 
The speakers are uttering, possibly overlapping, speech signals while moving in the environment. The method comprises two stages. The first stage \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hu:2023:EPO, author = "Guimin Hu and Yi Zhao and Guangming Lu", title = "Emotion Prediction Oriented Method With Multiple Supervisions for Emotion-Cause Pair Extraction", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1141--1152", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3250833", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3250833", abstract = "Emotion-cause pair extraction (ECPE) task aims to extract all the pairs of emotions and their causes from an unannotated emotion text. The previous works usually extract the emotion-cause pairs from two perspectives of emotion and cause. 
However, emotion \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Mohsenipour:2023:PCL, author = "Reza Mohsenipour and Daniel Massicotte and Wei-Ping Zhu", title = "{PI} Control of Loudspeakers Based on Linear Fractional Order Model", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1153--1162", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3250826", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3250826", abstract = "This paper aims at the proportional-integral (PI) control of the cone vibration of the electrodynamic loudspeakers system recently described using a linear fractional order model. After introducing the fractional order model of the circuit of these \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lubeck:2023:SUS, author = "Tim L{\"u}beck and Johannes M. Arend and Christoph P{\"o}rschmann", title = "Spatial Upsampling of Sparse Spherical Microphone Array Signals", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1163--1174", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3250841", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3250841", abstract = "We present a method for spatial upsampling of signals captured with spherical microphone arrays with a limited number of microphones. 
The upsampling is performed by adding virtual microphone signals using interpolation between the measured array signals. \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Deng:2023:CSB, author = "Jiajun Deng and Xurong Xie and Tianzi Wang and Mingyu Cui and Boyang Xue and Zengrui Jin and Guinan Li and Shujie Hu and Xunying Liu", title = "Confidence Score Based Speaker Adaptation of Conformer Speech Recognition Systems", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1175--1190", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3250842", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3250842", abstract = "Speaker adaptation techniques provide a powerful solution to customise automatic speech recognition (ASR) systems for individual users. 
Practical application of unsupervised model-based speaker adaptation techniques to data intensive end-to-end ASR \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:CSN, author = "Hongsheng Zhang and Jizhang Gan and Ting Liu and Kui Huang and Hong Yang", title = "Coefficients-Switched Normalized Least-Mean-Squares Adaption in Echo Canceler of Sparse-Echo-Path", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1191--1199", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3250824", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3250824", abstract = "The Normalized Least-Mean-Squares (NLMS) algorithm commonly used in echo cancelers suffers from a number of limitations due to the existing sparsity in the echo path. 
Although some sparsity-aware algorithms have been proposed, the high computational \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Guizzo:2023:LSE, author = "Eric Guizzo and Tillman Weyde and Simone Scardapane and Danilo Comminiello", title = "Learning Speech Emotion Representations in the Quaternion Domain", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1200--1212", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3250840", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3250840", abstract = "The modeling of human emotion expression in speech signals is an important, yet challenging task. The high resource demand of speech emotion recognition models, combined with the general scarcity of emotion-labelled data are obstacles to the development \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bai:2023:KIR, author = "Jiaqi Bai and Ze Yang and Jian Yang and Hongcheng Guo and Zhoujun Li", title = "{KINet}: Incorporating Relevant Facts Into Knowledge-Grounded Dialog Generation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1213--1222", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3240654", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3240654", abstract = "Knowledge-grounded conversation has led to great progress in 
producing informative dialog responses by leveraging external knowledge. This work focuses on two affiliated knowledge grounded conversation tasks: \emph{Knowledge Selection} and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2023:RSA, author = "Haiquan Zhao and Yuan Gao and Yingying Zhu", title = "Robust Subband Adaptive Filter Algorithms-Based Mixture Correntropy and Application to Acoustic Echo Cancellation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1223--1233", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3250845", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Wed May 17 14:29:03 MDT 2023", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3250845", abstract = "To acquire an improvement of the performance of the subband adaptive filter with impulsive interference, the normalized subband adaptive filter (NSAF) algorithm-based maximum correntropy criterion (MCC), called MCC-NSAF, has been developed. 
However, it is \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:PPE, author = "Chen Zhang and Luis Fernando D'Haro and Qiquan Zhang and Thomas Friedrichs and Haizhou Li", title = "{PoE}: A Panel of Experts for Generalized Automatic Dialogue Assessment", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1234--1250", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3250825", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3250825", abstract = "Chatbots are expected to be knowledgeable across multiple domains, e.g. for daily chit-chat, exchange of information, and grounding in emotional situations. To effectively measure the quality of such conversational agents, a model-based automatic dialogue \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2023:FSD, author = "Qing Wang and Jun Du and Hua-Xin Wu and Jia Pan and Feng Ma and Chin-Hui Lee", title = "A Four-Stage Data Augmentation Approach to {ResNet-Conformer} Based Acoustic Modeling for Sound Event Localization and Detection", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1251--1264", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3256088", ISSN = "2329-9290", ISSN-L = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3256088", abstract = "In this paper, we propose a novel four-stage data augmentation approach to ResNet-Conformer 
based acoustic modeling for sound event localization and detection (SELD). First, we explore two spatial augmentation techniques, namely audio channel swapping \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fu:2023:STD, author = "Yingwen Fu and Nankai Lin and Xiaohui Yu and Shengyi Jiang", title = "Self-Training With Double Selectors for Low-Resource Named Entity Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1265--1275", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3250828", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3250828", abstract = "Named Entity Recognition (NER) is fundamental to multiple downstream natural language processing (NLP) tasks, but most advanced NER methods heavily rely on massive labeled data with high cost. In this paper, we explore the effectiveness of self-training \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schulze-Forster:2023:UMS, author = "Kilian Schulze-Forster and Ga{\"e}l Richard and Liam Kelley and Clement S. J. 
Doire and Roland Badeau", title = "Unsupervised Music Source Separation Using Differentiable Parametric Source Models", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1276--1289", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3252272", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3252272", abstract = "Supervised deep learning approaches to underdetermined audio source separation achieve state-of-the-art performance but require a dataset of mixtures along with their corresponding isolated source signals. Such datasets can be extremely costly to obtain \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:SEC, author = "Yinggang Liu and Hong Fu and Ying Wei and Hanbing Zhang", title = "Sound Event Classification Based on Frequency-Energy Feature Representation and Two-Stage Data Dimension Reduction", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1290--1304", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3260708", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3260708", abstract = "The classification of environmental sound events is of great significance for applications such as machine hearing and acoustic surveillance. Feature representation and feature vector dimension directly affect system performance. 
To better extract \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Erdem:2023:PSR, author = "Ege Erdem and Zoran Cvetkovi{\'c} and H{\"u}seyin Hac{\i}habibo{\u{g}}lu", title = "{$3$D} Perceptual Soundfield Reconstruction via Virtual Microphone Synthesis", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1305--1317", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3260703", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3260703", abstract = "Perceptual soundfield reconstruction (PSR) is a multichannel audio recording and reproduction framework based on time-intensity panning in the horizontal plane. A practical limitation of PSR is that the optimal directivity patterns required by the system \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shi:2023:FDO, author = "Dongyuan Shi and Woon-Seng Gan and Bhan Lam and Xiaoyi Shen", title = "A Frequency-Domain Output-Constrained Active Noise Control Algorithm Based on an Intuitive Circulant Convolutional Penalty Factor", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1318--1332", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3260702", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3260702", abstract = "Due to their computational efficiency, least mean square (LMS)-based algorithms are still widely utilized to achieve 
optimal control in active noise control (ANC) applications. Real-world implementation of advanced ANC functionalities, such as \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ozturk:2023:SRS, author = "Muhammed Zahid Ozturk and Chenshu Wu and Beibei Wang and Min Wu and K. J. Ray Liu", title = "{RadioSES}: {mmWave}-Based Audioradio Speech Enhancement and Separation System", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1333--1347", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3250846", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3250846", abstract = "Speech enhancement and separation have been a long-standing problem, especially with the recent advances using a single microphone. 
Although microphones perform well in constrained settings, their performance for speech separation decreases in noisy \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:RVQ, author = "Jianwei Zhang and Julie Liss and Suren Jayasuriya and Visar Berisha", title = "Robust Vocal Quality Feature Embeddings for Dysphonic Voice Detection", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1348--1359", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3261753", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3261753", abstract = "Approximately 1.2\% of the world's population has impaired voice production. As a result, automatic dysphonic voice detection has attracted considerable academic and clinical interest. However, existing methods for automated voice assessment \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pandey:2023:ATN, author = "Ashutosh Pandey and DeLiang Wang", title = "Attentive Training: a New Training Framework for Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1360--1370", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3260711", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3260711", abstract = "Dealing with speech interference in a speech enhancement system requires either speaker separation or target speaker extraction. 
Speaker separation has multiple output streams with arbitrary assignments while target speaker extraction requires additional \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Inaguma:2023:AKD, author = "Hirofumi Inaguma and Tatsuya Kawahara", title = "Alignment Knowledge Distillation for Online Streaming Attention-Based Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1371--1385", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2021.3133217", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2021.3133217", abstract = "This article describes an efficient training method for online streaming attention-based encoder-decoder (AED) automatic speech recognition (ASR) systems. AED models have achieved competitive performance in offline scenarios by jointly optimizing all \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Reddy:2023:EBS, author = "Mittapalle Kiran Reddy and Paavo Alku", title = "Exemplar-Based Sparse Representations for Detection of {Parkinson}'s Disease From Speech", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1386--1396", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3260709", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3260709", abstract = "Parkinson's disease (PD) is a progressive neurological disorder which affects the motor system. 
The automatic detection of PD improves the diagnosis of the disease, and it can be done in a non-invasive manner from speech. In this paper, we \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kita:2023:SSL, author = "Shunsuke Kita and Yoshinobu Kajikawa", title = "Sound Source Localization Inside a Structure Under Semi-Supervised Conditions", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1397--1408", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3263776", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3263776", abstract = "We propose a method for applying a sound source localization (SSL) model trained on simulated data in a real-world environment, with a domain transfer (DT) model for the SSL inside a structure. The DT model transfers real data into pseudo-simulation data. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2023:PFH, author = "Guowei Wu and Shipei Liu and Xiaoya Fan", title = "The Power of Fragmentation: a Hierarchical Transformer Model for Structural Segmentation in Symbolic Music Generation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1409--1420", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3263797", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3263797", abstract = "Symbolic music generation relies on the contextual representation capabilities of the generative model, where the most prevalent approach is the Transformer-based model. Learning contextual representations are also related to the structural elements in \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Luo:2023:DMD, author = "Xueqin Luo and Gongping Huang and Jilu Jin and Jingdong Chen and Jacob Benesty and Wen Zhang and Mengyao Zhu and Chunjian Li", title = "Design of Maximum Directivity Beamformers With Linear Acoustic Vector Sensor Arrays", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1421--1435", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3256093", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3256093", abstract = "This paper studies the design of maximum directivity factor (MDF) beamformers based on uniform linear arrays (ULAs) 
consisting of acoustic vector sensors (AVSs). We first derive the main lobe constraints, which ensure that the beamformer's \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fan:2023:CAB, author = "Ruchao Fan and Wei Chu and Peng Chang and Abeer Alwan", title = "A {CTC} Alignment-Based Non-Autoregressive Transformer for End-to-End Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1436--1448", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3263789", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3263789", abstract = "Recently, end-to-end models have been widely used in automatic speech recognition (ASR) systems. Two of the most representative approaches are connectionist temporal classification (CTC) and attention-based encoder-decoder (AED) models. Autoregressive \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:DAN, author = "Tianyou Li and Siyuan Lian and Sipei Zhao and Jing Lu and Ian S. 
Burnett", title = "Distributed Active Noise Control Based on an Augmented Diffusion {FxLMS} Algorithm", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1449--1463", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3261742", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3261742", abstract = "Multichannel active noise control (ANC) systems have been widely investigated for low-frequency noise attenuation over a spatial region. Using a conventional centralized control strategy based on the multichannel filtered-\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xie:2023:EPQ, author = "Jiayuan Xie and Wenhao Fang and Qingbao Huang and Yi Cai and Tao Wang", title = "Enhancing Paraphrase Question Generation With Prior Knowledge", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1464--1475", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3221045", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221045", abstract = "Paraphrase question generation (PQG) aims to rewrite a given original question to a new paraphrase question, where the paraphrase question needs to have the same expressed meaning as the original question, but have a difference in expression form. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2023:IIM, author = "Chen Chen and Hansheng Hong and Jie Guo and Bin Song", title = "Inter-Intra Modal Representation Augmentation With Trimodal Collaborative Disentanglement Network for Multimodal Sentiment Analysis", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1476--1488", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3263801", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3263801", abstract = "Recently, Multimodal Sentiment Analysis (MSA) is a challenging research area given its complex nature, and humans express emotional cues across various modalities such as language, facial expressions, and speech. 
Representation and fusion of features are \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2023:GGF, author = "Jian Yang and Yuwei Yin and Liqun Yang and Shuming Ma and Haoyang Huang and Dongdong Zhang and Furu Wei and Zhoujun Li", title = "{GTrans}: Grouping and Fusing Transformer Layers for Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1489--1498", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3221040", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3221040", abstract = "Transformer structure, stacked by a sequence of encoder and decoder network layers, achieves significant development in neural machine translation. 
However, vanilla Transformer mainly exploits the top-layer representation, assuming the lower layers \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2023:GNL, author = "Xin Wu and Yi Cai and Zetao Lian and Ho-fung Leung and Tao Wang", title = "Generating Natural Language From Logic Expressions With Structural Representation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1499--1510", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3263784", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3263784", abstract = "Incorporating logic reasoning with deep neural networks (DNNs) is an important challenge in machine learning. In this article, we study the problem of converting logical expressions into natural language. In particular, given a sequential logic expression, 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:UST, author = "Yi Li and Yang Sun and Wenwu Wang and Syed Mohsen Naqvi", title = "U-Shaped Transformer With Frequency-Band Aware Attention for Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1511--1521", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3265839", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3265839", abstract = "Recently, Transformer shows the potential to exploit the long-range sequence dependency in speech with self-attention. It has been introduced in single channel speech enhancement to improve the accuracy of speech estimation from a noise mixture. 
However, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Antonanzas:2023:RMT, author = "Christian Anto{\~n}anzas and Miguel Ferrer and Maria de Diego and Alberto Gonzalez", title = "Remote Microphone Technique for Active Noise Control Over Distributed Networks", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1522--1535", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3264600", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3264600", abstract = "Multichannel Active Noise Control (ANC) headrest systems have usually been designed with the objective of creating quiet areas at the passenger positions within the cabin of a public transport. Due to the high computational demands of dealing with \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhu:2023:CDF, author = "Yi Zhu and Abhishek Tiwari and Jo{\~a}o Monteiro and Shruti Kshirsagar and Tiago Henrique Falk", title = "{COVID-19} Detection via Fusion of Modulation Spectrum and Linear Prediction Speech Features", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1536--1549", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3265603", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3265603", abstract = "The coronavirus disease 2019 (COVID-19) pandemic has drastically impacted life around the globe. 
As life returns to pre-pandemic routines, COVID-19 testing has become a key component, assuring that travellers and citizens are free from the disease. \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:ESR, author = "Jijie Li and Kai Shuang and Jinyu Guo and Zengyi Shi and Hongman Wang", title = "Enhancing Semantic Relation Classification With Shortest Dependency Path Reasoning", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1550--1560", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3265205", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3265205", abstract = "Relation Classification (RC) is a basic and essential task of Natural Language Processing. Existing RC methods can be classified into two categories: sequence-based methods and dependency-based methods. 
Sequence-based methods identify the target relation \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{He:2023:AMM, author = "Mao-Kui He and Jun Du and Qing-Feng Liu and Chin-Hui Lee", title = "{ANSD-MA-MSE}: Adaptive Neural Speaker Diarization Using Memory-Aware Multi-Speaker Embedding", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1561--1573", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3265199", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3265199", abstract = "In this paper, we propose a neural speaker diarization (NSD) network architecture consisting of three key components. First, a memory-aware multi-speaker embedding (MA-MSE) mechanism is proposed to facilitate a dynamical refinement of speaker embedding to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2023:DFB, author = "Longting Xu and Jichen Yang and Chang Huai You and Xinyuan Qian and Daiyu Huang", title = "Device Features Based on Linear Transformation With Parallel Training Data for Replay Speech Detection", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1574--1586", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3267610", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3267610", abstract = "Replay speech poses a growing threat to speaker verification systems, thus the detection of 
replay speech becomes increasingly important. A critical factor differentiating replay speech and genuine speech is the representation of device information. \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fang:2023:IUN, author = "Huajian Fang and Dennis Becker and Stefan Wermter and Timo Gerkmann", title = "Integrating Uncertainty Into Neural Network-Based Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1587--1600", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3265202", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3265202", abstract = "Supervised masking approaches in the time-frequency domain aim to employ deep neural networks to estimate a multiplicative mask to extract clean speech. This leads to a single estimate for each input without any guarantees or measures of reliability. 
In \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qin:2023:MPT, author = "Libo Qin and Xiao Xu and Lehan Wang and Yue Zhang and Wanxiang Che", title = "Modularized Pre-Training for End-to-End Task-Oriented Dialogue", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1601--1610", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3244503", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3244503", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:LDR, author = "Hanlei Zhang and Hua Xu and Shaojie Zhao and Qianrui Zhou", title = "Learning Discriminative Representations and Decision Boundaries for Open Intent Detection", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1611--1623", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3265203", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3265203", abstract = "Open intent detection is a significant problem in natural language understanding, which aims to identify the unseen open intent while ensuring known intent identification performance. However, current methods face two major challenges. 
Firstly, they \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bao:2023:GCR, author = "Guangsheng Bao and Yue Zhang", title = "A General Contextualized Rewriting Framework for Text Summarization", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1624--1635", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3268569", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3268569", abstract = "The rewriting method for text summarization combines the advantage of extractive and abstractive approaches, improving the conciseness and readability of extractive summaries. Existing rewriting systems take extractive sentences as the only input and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kirsch:2023:UFA, author = "Christoph Kirsch and Stephan D. Ewert", title = "A Universal Filter Approximation of Edge Diffraction for Geometrical Acoustics", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1636--1651", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3264737", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3264737", abstract = "Sound propagation in urban and indoor environments often involves diffraction at corners, finite objects and openings, resulting in perceptually relevant frequency-dependent attenuation. 
Geometrical acoustics (GA) has become a de-facto standard for the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Goli:2023:DLB, author = "Peyman Goli and Steven van de Par", title = "Deep Learning-Based Speech Specific Source Localization by Using Binaural and Monaural Microphone Arrays in Hearing Aids", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1652--1666", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3268734", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3268734", abstract = "A deep learning-based method is proposed for jointly detecting and localizing speech sources in a complex acoustic scene by using microphones of a hearing aid. 
Motivated by the human auditory system, peripheral preprocessing is applied on the microphone \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Thien:2023:IFP, author = "Nguyen Binh Thien and Yukoh Wakabayashi and Kenta Iwai and Takanobu Nishiura", title = "Inter-Frequency Phase Difference for Phase Reconstruction Using Deep Neural Networks and Maximum Likelihood", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1667--1680", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3268577", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3268577", abstract = "This paper presents improvements to two-stage algorithms for estimating the short-time Fourier transform (STFT) phase from only the amplitude by using deep neural networks (DNNs). The phase is difficult to reconstruct due to its sensitivity to the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chetupalli:2023:SCS, author = "Srikanth Raj Chetupalli and Emanu{\"e}l A. P. 
Habets", title = "Speaker Counting and Separation From Single-Channel Noisy Mixtures", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1681--1692", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3268572", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3268572", abstract = "We address the problem of speaker counting and separation from a noisy, single-channel, multi-source, recording. Most of the works in the literature assume mixtures containing two to five speakers. In this work, we consider noisy speech mixtures with one \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:ITR, author = "Guangyan Zhang and Ying Qin and Wenjie Zhang and Jialun Wu and Mei Li and Yutao Gai and Feijun Jiang and Tan Lee", title = "{iEmoTTS}: Toward Robust Cross-Speaker Emotion Transfer and Control for Speech Synthesis Based on Disentanglement Between Prosody and Timbre", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1693--1705", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3268571", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3268571", abstract = "Cross-speaker emotion transfer is a common approach to generating emotional speech when speech data with emotion labels from target speakers is not available. This paper presents a novel cross-speaker emotion transfer system named iEmoTTS.
The system is \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tao:2023:SST, author = "Ruijie Tao and Kong Aik Lee and Rohan Kumar Das and Ville Hautam{\"a}ki and Haizhou Li", title = "Self-Supervised Training of Speaker Encoder With Multi-Modal Diverse Positive Pairs", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1706--1719", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3268568", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3268568", abstract = "We study a novel neural speaker encoder and its training strategies for speaker recognition without using any identity labels. The speaker encoder is trained to extract a fixed dimensional speaker embedding from a spoken utterance of variable length. \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2023:DDD, author = "Dongchao Yang and Jianwei Yu and Helin Wang and Wen Wang and Chao Weng and Yuexian Zou and Dong Yu", title = "Diffsound: Discrete Diffusion Model for Text-to-Sound Generation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1720--1733", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3268730", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3268730", abstract = "Generating sound effects that people want is an important topic. However, there are limited studies in this area for sound generation. 
In this study, we investigate generating sound conditioned on a text prompt and propose a novel text-to-sound generation \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Krug:2023:AVL, author = "Paul Konstantin Krug and Peter Birkholz and Branislav Gerazov and Daniel Rudolph van Niekerk and Anqi Xu and Yi Xu", title = "Artificial Vocal Learning Guided by Phoneme Recognition and Visual Information", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1734--1744", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3264454", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3264454", abstract = "This paper introduces a paradigm shift regarding vocal learning simulations, in which the communicative function of speech acquisition determines the learning process and intelligibility is considered the primary measure of learning success. 
Thereby, a \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hong:2023:DRP, author = "Qian-Bei Hong and Chung-Hsien Wu and Hsin-Min Wang", title = "Decomposition and Reorganization of Phonetic Information for Speaker Embedding Learning", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1745--1757", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3267833", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3267833", abstract = "Speech content is closely related to the stability of speaker embeddings in speaker verification tasks. In this paper, we propose a novel architecture based on self-constraint learning (SCL) and reconstruction task (RT) to remove the influence of phonetic \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jiang:2023:SEI, author = "Wenbin Jiang and Kai Yu", title = "Speech Enhancement With Integration of Neural Homomorphic Synthesis and Spectral Masking", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1758--1770", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3271151", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3271151", abstract = "Speech enhancement refers to suppressing the background noise to improve the perceptual quality and intelligibility of the observed noisy speech. 
Recently, speech enhancement algorithms based on deep neural networks (DNNs) have replaced traditional \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:MLS, author = "Shu'ang Li and Xuming Hu and Li Lin and Aiwei Liu and Lijie Wen and Philip S. Yu", title = "A Multi-Level Supervised Contrastive Learning Framework for Low-Resource Natural Language Inference", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1771--1783", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3270771", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3270771", abstract = "Natural Language Inference (NLI) is a growingly essential task in natural language understanding, which requires inferring the relationship between the sentence pairs \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zheng:2023:BCE, author = "Xiaoqing Zheng", title = "Building Conventional {``Experts''} With a Dialogue Logic Programming Language", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1784--1796", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3271119", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3271119", abstract = "We describe DiaProlog, a dialogue logic programming language that extends the vanilla Prolog with the features to facilitate the integration of reasoning capabilities into task-oriented 
dialogue systems. The extended language combines the expressive power \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2023:TOD, author = "Haitao Lin and Junnan Zhu and Lu Xiang and Feifei Zhai and Yu Zhou and Jiajun Zhang and Chengqing Zong", title = "Topic-Oriented Dialogue Summarization", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1797--1810", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3271118", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3271118", abstract = "A multi-turn dialogue often contains multiple discussion topics. In several scenarios (e.g., customer service dispute, public opinion monitoring), people are only interested in the gist of a specific topic in the dialogue. Therefore, we propose a novel \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Guo:2023:MTM, author = "Haohan Guo and Fenglong Xie and Xixin Wu and Frank K. Soong and Helen Meng", title = "{MSMC-TTS}: Multi-Stage Multi-Codebook {VQ-VAE} Based Neural {TTS}", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1811--1824", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3272470", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3272470", abstract = "This article aims to improve neural TTS with vector-quantized, compact speech representations. 
We propose a Vector-Quantized Variational AutoEncoder (VQ-VAE) based feature analyzer to encode acoustic features into sequences with different time resolutions, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:DFN, author = "Bei Liu and Zhengyang Chen and Yanmin Qian", title = "Depth-First Neural Architecture With Attentive Feature Fusion for Efficient Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1825--1838", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3273417", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3273417", abstract = "Deep speaker embedding learning based on neural networks has become the predominant approach in speaker verification (SV) currently. In prior studies, researchers have investigated various network architectures. However, rare works pay attention to the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ghosh:2023:BCI, author = "Ria Ghosh and John H. L.
Hansen", title = "Bilateral Cochlear Implant Processing of Coding Strategies With {CCi-MOBILE}, an Open-Source Research Platform", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1839--1850", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3267608", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3267608", abstract = "While speech understanding for cochlear implant (CI) users in quiet is relatively effective, listeners experience difficulty in identification of speaker and sound location. To assist for better residual hearing abilities and speech intelligibility \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2023:DND, author = "Aolong Zhou and Wen Zhang and Guojun Xu and Xiaoyong Li and Kefeng Deng and Junqiang Song", title = "{DBSA-Net}: Dual Branch Self-Attention Network for Underwater Acoustic Signal Denoising", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1851--1865", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3275030", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3275030", abstract = "Underwater acoustic signal denoising is a challenging task due to the complexity of the underwater environment. 
Most of the existing methods cannot effectively cope with the problem of underwater acoustic signal (UWAS) denoising at low signal-to-noise \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2023:MAM, author = "Weiwei Lin and Man-Wai Mak", title = "Model-Agnostic Meta-Learning for Fast Text-Dependent Speaker Embedding Adaptation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1866--1876", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3275029", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3275029", abstract = "By constraining the lexical content of input speech, text-dependent speaker verification (TD-SV) offers more reliable performance than text-independent speaker verification (TI-SV) when dealing with short utterances. Because speech with constrained \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Galassi:2023:MTA, author = "Andrea Galassi and Marco Lippi and Paolo Torroni", title = "Multi-Task Attentive Residual Networks for Argument Mining", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1877--1892", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3275040", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3275040", abstract = "We explore the use of residual networks and neural attention for multiple argument mining tasks. 
We propose a residual architecture that exploits attention, multi-task learning, and makes use of ensemble, without any assumption on document or argument \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Luo:2023:MSS, author = "Yi Luo and Jianwei Yu", title = "Music Source Separation With Band-Split {RNN}", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1893--1901", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3271145", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3271145", abstract = "The performance of music source separation (MSS) models has been greatly improved in recent years thanks to the development of novel neural network architectures and training pipelines. 
However, recent model designs for MSS were mainly motivated by other \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Matsubara:2023:HNF, author = "Keisuke Matsubara and Takuma Okamoto and Ryoichi Takashima and Tetsuya Takiguchi and Tomoki Toda and Hisashi Kawai", title = "{Harmonic-Net}: Fundamental Frequency and Speech Rate Controllable Fast Neural Vocoder", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1902--1915", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3275032", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3275032", abstract = "There is a need to improve the synthesis quality of HiFi-GAN-based real-time neural speech waveform generative models on CPUs while preserving the controllability of fundamental frequency \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2023:OCL, author = "Yi Zhou and Zhizheng Wu and Xiaohai Tian and Haizhou Li", title = "Optimization of Cross-Lingual Voice Conversion With Linguistics Losses to Reduce Foreign Accents", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1916--1926", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3271107", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3271107", abstract = "Cross-lingual voice conversion (XVC) transforms the speaker identity of a source speaker to that of a target speaker
who speaks a different language. Due to the intrinsic differences between languages, the converted speech may carry an unwanted foreign \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhu:2023:JSE, author = "Qiu-Shi Zhu and Jie Zhang and Zi-Qiang Zhang and Li-Rong Dai", title = "A Joint Speech Enhancement and Self-Supervised Representation Learning Framework for Noise-Robust Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1927--1939", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3275033", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3275033", abstract = "Though speech enhancement (SE) can be used to improve speech quality in noisy environments, it may also cause distortions that degrade the performance of automatic speech recognition (ASR) models. 
Self-supervised pre-training, on the other hand, has been \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sun:2023:IST, author = "Siqi Sun and Korin Richmond and Hao Tang", title = "Improving {Seq2Seq} {TTS} Frontends With Transcribed Speech Audio", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1940--1952", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3273414", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3273414", abstract = "Due to the data inefficiency and low speech quality of grapheme-based end-to-end text-to-speech (TTS), having a separate high-performance TTS linguistic frontend is still commonly regarded as necessary. However, a TTS frontend is itself difficult to build \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2023:MFS, author = "Shih-Lun Wu and Yi-Hsuan Yang", title = "{MuseMorphose}: Full-Song and Fine-Grained Piano Music Style Transfer With One Transformer {VAE}", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1953--1967", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3270726", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3270726", abstract = "Transformers and variational autoencoders (VAE) have been extensively employed for symbolic (e.g., MIDI) domain music generation. 
While the former boast an impressive capability in modeling long sequences, the latter allow users to willingly exert control \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gao:2023:PIF, author = "Xiaoxue Gao and Chitralekha Gupta and Haizhou Li", title = "{PoLyScriber}: Integrated Fine-Tuning of Extractor and Lyrics Transcriber for Polyphonic Music", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1968--1981", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3275036", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3275036", abstract = "Lyrics transcription of polyphonic music is challenging as the background music affects lyrics intelligibility. Typically, lyrics transcription can be performed by a two-step pipeline, i.e. 
a singing vocal extraction front end, followed by a lyrics \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lian:2023:PAP, author = "Zhicheng Lian and Haonan Cheng and Jiawan Zhang", title = "{PQG-A2SA}: Performance Quantification Guided Audio-to-Score Alignment for Orchestral Music", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1982--1992", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3277290", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3277290", abstract = "Audio-to-score alignment is a multi-modal task that aims at generating an accurate mapping between symbolic and signal-level representations of musical signals, which is important for music performance analysis and retrieval. Among numerous music genres, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ni:2023:SPA, author = "Jingen Ni and Ningning Zhang and Haofen Li", title = "Sparsity-Promoting Affine Projection Algorithm With Periodically-Updated Gain Matrix and Its Performance Analysis", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "1993--2003", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3277289", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3277289", abstract = "Sparse system identification is often encountered in applications such as network and acoustic echo cancellation.
This work applies the sparsity promoting method to the affine projection algorithm (APA) to develop a sparsity-promoting APA (SAPA). To \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Das:2023:GFD, author = "Orchisama Das and Sebastian J. Schlecht and Enzo {De Sena}", title = "Grouped Feedback Delay Networks With Frequency-Dependent Coupling", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2004--2015", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3277368", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3277368", abstract = "Feedback Delay Networks are one of the most popular and efficient means of generating artificial reverberation. Recently, we proposed the Grouped Feedback Delay Network (GFDN), which couples multiple FDNs while maintaining system stability. 
The GFDN can \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2023:DDM, author = "Xudong Zhao and Gongping Huang and Jingdong Chen and Jacob Benesty", title = "Design of {$2$D} and {$3$D} Differential Microphone Arrays With a Multistage Framework", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2016--2031", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3278182", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3278182", abstract = "Differential microphone arrays (DMAs) have demonstrated a great potential for high-fidelity acoustic and speech signal acquisition in a wide range of applications since such arrays are able to achieve frequency-invariant beampatterns with high \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hsu:2023:ERG, author = "Jia-Hao Hsu and Jeremy Chang and Min-Hsueh Kuo and Chung-Hsien Wu", title = "Empathetic Response Generation Based on Plug-and-Play Mechanism With Empathy Perturbation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2032--2042", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3277274", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3277274", abstract = "Spoken dialogue systems have rapidly developed but are often viewed as inhumane because they lack empathetic communication skills. 
In this study, a transformer-based language model (DialoGPT fine-tuned on the EmpatheticDialogues dataset) was combined with \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Dutt:2023:WMA, author = "Aditya Dutt and Paul Gader", title = "Wavelet Multiresolution Analysis Based Speech Emotion Recognition System Using {$1$D} {CNN LSTM} Networks", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2043--2054", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3277291", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3277291", abstract = "Speech Emotion Recognition (SER) is the task of recognizing a speaker's emotional state from speech. SER plays a significant role in Human-Computer Interaction and psychological assessment. Several kinds of time-frequency representations like \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Morales:2023:GAE, author = "Arturo Morales and Juan I. Yuz and Juan P. Cort{\'e}s and Javier G. 
Fontanet and Mat{\'\i}as Za{\~n}artu", title = "Glottal Airflow Estimation Using Neck Surface Acceleration and Low-Order {Kalman} Smoothing", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2055--2066", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3277269", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3277269", abstract = "The use of non-invasive skin accelerometers placed over the extrathoracic trachea has been proposed in the literature for measuring vocal function. Glottal airflow is estimated using inverse filtering or Bayesian techniques based on a subglottal impedance-\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hosoda:2023:CDP, author = "Yuya Hosoda and Arata Kawamura and Youji Iiguni", title = "Complex-Domain Pitch Estimation Algorithm for Narrowband Speech Signals", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2067--2078", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3278488", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3278488", abstract = "We propose a complex-domain pitch estimation algorithm for narrowband speech signals, which utilizes a complex spectrum containing both amplitude and phase spectrum information.
Traditional frequency-domain pitch estimation algorithms assume that a speech \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:AEB, author = "Zhidong Liu and Junhui Li and Muhua Zhu", title = "Alleviating Exposure Bias for Neural Machine Translation via Contextual Augmentation and Self Distillation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2079--2089", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3277245", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3277245", abstract = "In neural machine translation (NMT), most sequence-to-sequence (seq2seq) models are trained only with the teacher-forcing paradigm, where the ground truth history is used to predict the next ground truth word. At the inference stage, however, the decoder \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Beit-On:2023:WFS, author = "Hanan Beit-On and Tom Shlomo and Boaz Rafaely", title = "Weighted Frequency Smoothing for Enhanced Speaker Localization", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2090--2099", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3277270", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3277270", abstract = "The coherent signal subspace method may be used in order to apply subspace localization methods (e.g. MUSIC) to coherent sources. 
This method involves a focusing process followed by frequency smoothing, which is intended to decorrelate source signals from \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gao:2023:PMB, author = "Shan Gao and Xihong Wu and Tianshu Qu", title = "A Physical Model-Based Self-Supervised Learning Method for Signal Enhancement Under Reverberant Environment", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2100--2110", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3277246", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3277246", abstract = "In a reverberant environment, interferences such as reflections and background noise can degrade the perception of the sound source signal. 
Although the DNN-based methods have made a tremendous breakthrough in addressing this issue, the performance of \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jiang:2023:LDP, author = "Xue Jiang and Xiulian Peng and Huaying Xue and Yuan Zhang and Yan Lu", title = "Latent-Domain Predictive Neural Speech Coding", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2111--2123", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3277693", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3277693", abstract = "Neural audio/speech coding has recently demonstrated its capability to deliver high quality at much lower bitrates than traditional methods. 
However, existing neural audio/speech codecs employ either acoustic features or learned blind features with a \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Deng:2023:LFS, author = "Shumin Deng and Jiacheng Yang and Hongbin Ye and Chuanqi Tan and Mosha Chen and Songfang Huang and Fei Huang and Huajun Chen and Ningyu Zhang", title = "{LOGEN}: Few-Shot Logical Knowledge-Conditioned Text Generation With Self-Training", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2124--2133", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3275028", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3275028", abstract = "Natural language generation from structured data mainly focuses on surface-level descriptions, suffering from uncontrollable content selection and low fidelity. 
Previous works leverage logical forms to facilitate logical knowledge-conditioned text \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:UFA, author = "Yuanzhi Liu and Min He and Qingqing Yang and Gwanggil Jeon", title = "An Unsupervised Framework With Attention Mechanism and Embedding Perturbed Encoder for Non-Parallel Text Sentiment Style Transfer", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2134--2144", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3278185", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3278185", abstract = "Text sentiment style transfer aims to extract the sentiment words from a sentence and transfer them into another expected sentiment style while retaining the original sentence's content. 
However, previous works have not achieved satisfactory \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ai:2023:AAF, author = "Yang Ai and Zhen-Hua Ling", title = "{APNet}: an All-Frame-Level Neural Vocoder Incorporating Direct Prediction of Amplitude and Phase Spectra", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2145--2157", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3277276", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3277276", abstract = "This paper presents a novel neural vocoder named APNet which reconstructs speech waveforms from acoustic features by predicting amplitude and phase spectra directly. The APNet vocoder is composed of an amplitude spectrum predictor (ASP) and a phase \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2023:LCC, author = "Fei Zhao and Zhen Wu and Liang He and Xin-Yu Dai", title = "Label-Correction Capsule Network for Hierarchical Text Classification", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2158--2168", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282099", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282099", abstract = "Hierarchical Text Classification (HTC) aims to predict the category of a document in a given label hierarchy. 
Considering a parent-child relationship among labels at different levels, previous works mainly leverage the parent-level label information to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Subakan:2023:ESA, author = "Cem Subakan and Mirco Ravanelli and Samuele Cornell and Fran{\c{c}}ois Grondin and Mirko Bronzi", title = "Exploring Self-Attention Mechanisms for Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2169--2180", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282097", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282097", abstract = "Transformers have enabled impressive improvements in deep learning. They often outperform recurrent and convolutional models in many tasks while taking advantage of parallel processing. 
Recently, we proposed the SepFormer, which obtains state-of-the-art \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:NMC, author = "Chenggang Zhang and Jinjiang Liu and Hao Li and Xueliang Zhang", title = "Neural Multi-Channel and Multi-Microphone Acoustic Echo Cancellation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2181--2192", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282103", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282103", abstract = "Deep learning is introduced in multi-channel (MC) and multi-microphone (MM) acoustic echo cancellation (AEC) without decorrelation to the loudspeaker signals and achieves remarkable performance. In this article, we propose a complex spectral mapping \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:DTI, author = "Zheng Liu and Xin Kang and Fuji Ren", title = "Dual-{TBNet}: Improving the Robustness of Speech Features via Dual-Transformer-{BiLSTM} for Speech Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2193--2203", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282092", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282092", abstract = "Speech emotion recognition has always been one of the topics that have attracted a lot of attention from many researchers. 
In traditional feature fusion methods, the speech features used only come from the data set, and the weak robustness of features can \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cumani:2023:DUS, author = "Sandro Cumani and Salvatore Sarni", title = "The Distributions of Uncalibrated Speaker Verification Scores: a Generative Model for Domain Mismatch and Trial-Dependent Calibration", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2204--2219", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282096", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282096", abstract = "Speaker verification systems that compute log-likelihood ratios (LLR) between the same and different speaker hypotheses allow for cost-effective decisions that depend only on prior information. 
Domain mismatch, inaccurate model assumptions or the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ai:2023:CML, author = "Xi Ai and Bin Fang", title = "Cross-Modal Language Modeling in Multi-Motion-Informed Context for Lip Reading", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2220--2232", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282109", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282109", abstract = "We observe that for lip reading, the language is locally transformed, instead of globally transformed, i.e., speaking and writing follow the same basic grammar rules. In this work, we present a cross-modal language model to tackle the lip-reading \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fuglsig:2023:MPN, author = "Andreas Jonas Fuglsig and Jesper Jensen and Zheng-Hua Tan and Lars S{\o}ndergaard Bertelsen and Jens Christian Lindof and Jan {\O}stergaard", title = "Minimum Processing Near-End Listening Enhancement", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2233--2245", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282094", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282094", abstract = "The intelligibility and quality of speech from a mobile phone or public announcement system are often affected by background noise in the 
listening environment. By pre-processing the speech signal it is possible to improve the speech intelligibility and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xie:2023:TTA, author = "Zhiwen Xie and Runjie Zhu and Jin Liu and Guangyou Zhou and Jimmy Xiangji Huang", title = "{TARGAT}: a Time-Aware Relational Graph Attention Model for Temporal Knowledge Graph Embedding", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2246--2258", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282101", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282101", abstract = "Temporal knowledge graph embedding (TKGE) aims to learn the embedding of entities and relations in a temporal knowledge graph (TKG). Although the previous graph neural networks (GNN) based models have achieved promising results, they cannot directly \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:OQC, author = "Cuilian Zhang and Derek F. Wong and Eddy S. K. Lei and Runzhe Zhan and Lidia S. 
Chao", title = "Obscurity-Quantified Curriculum Learning for Machine Translation Evaluation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2259--2271", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282105", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282105", abstract = "The pre-trained language model has been developed for evaluating the quality of machine translation. It achieves state-of-the-art results. However, building a model for the evaluation of machine translation still faces the following challenges: (1) large \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:HEE, author = "Yaxin Liu and Yan Zhou and Ziming Li and Junlin Wang and Wei Zhou and Songlin Hu", title = "{HIM}: an End-to-End Hierarchical Interaction Model for Aspect Sentiment Triplet Extraction", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2272--2285", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282379", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282379", abstract = "Aspect Sentiment Triplet Extraction (ASTE) is an emerging task of fine-grained sentiment analysis, which aims to extract aspect terms, associated opinion terms, and sentiment polarities in the form of triplets. 
Thus, ASTE involves two groups of subtasks: \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wakabayashi:2023:SFI, author = "Yukoh Wakabayashi and Kouei Yamaoka and Nobutaka Ono", title = "Sound Field Interpolation for Rotation-Invariant Multichannel Array Signal Processing", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2286--2298", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282098", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282098", abstract = "In this paper, we present a sound field interpolation for array signal processing (ASP) that is robust to rotation of a circular microphone array (CMA), and we evaluate beamforming as one of its applications. 
Most ASP methods assume a time-invariant \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nielsen:2023:ATN, author = "Jesper Kj{\ae}r Nielsen and Mads Gr{\ae}sb{\o}ll Christensen and Jesper B{\"u}nsow Boldt", title = "An Analysis of Traditional Noise Power Spectral Density Estimators Based on the {Gaussian} Stochastic Volatility Model", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2299--2313", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282107", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282107", abstract = "Many single- and multi-channel speech enhancement techniques, old and new, rely in one way or another on estimates of the noise power spectral density (PSD). 
For example, the classical Wiener filter requires that either the speech or noise PSD be \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jacome:2023:SEL, author = "Karen Gissell Rosero Jacome and Felipe Leonel Grijalva and Bruno Sanches Masiero", title = "Sound Events Localization and Detection Using Bio-Inspired Gammatone Filters and Temporal Convolutional Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2314--2324", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3284525", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3284525", abstract = "The auditory brain circuits are biologically constructed to recognize and localize sounds by encoding a combination of cues that help individuals interpret sounds.
The development of computational methods inspired by human capacities has established \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yuan:2023:RGR, author = "Lin Yuan and Guoheng Huang and Fenghuan Li and Xiaochen Yuan and Chi-Man Pun and Guo Zhong", title = "{RBA-GCN}: Relational Bilevel Aggregation Graph Convolutional Network for Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2325--2337", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3284509", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3284509", abstract = "Emotion recognition in conversation (ERC) has received increasing attention from researchers due to its wide range of applications. 
As conversation has a natural graph structure, numerous approaches used to model ERC based on graph convolutional networks \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Poirot:2023:PES, author = "Samuel Poirot and Stefan Bilbao and Mitsuko Aramaki and S{\o}lvi Ystad and Richard Kronland-Martinet", title = "A Perceptually Evaluated Signal Model: Collisions Between a Vibrating Object and an Obstacle", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2338--2350", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3284515", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3284515", abstract = "The collision interaction mechanism between a vibrating string and a non-resonant obstacle is at the heart of many musical instruments. This article focuses on the identification of perceptually salient auditory features related to this phenomenon. 
The \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Richter:2023:SED, author = "Julius Richter and Simon Welker and Jean-Marie Lemercier and Bunlong Lay and Timo Gerkmann", title = "Speech Enhancement and Dereverberation With Diffusion-Based Generative Models", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2351--2364", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3285241", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3285241", abstract = "In this work, we build upon our previous publication and use diffusion-based generative models for speech enhancement. We present a detailed overview of the diffusion process that is based on a stochastic differential equation and delve into an extensive \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Barysenka:2023:SBI, author = "Siarhei Y. Barysenka and Vasili I. 
Vorobiov", title = "{SNR}-Based Inter-Component Phase Estimation Using Bi-Phase Prior Statistics for Single-Channel Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2365--2381", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3284514", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3284514", abstract = "The fundamental problem of phase-aware single-channel speech enhancement is the estimation of the harmonic phase of signal components from noisy observations. One approach to obtain an estimate of the harmonic phase is by smoothing the noisy harmonic \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zeng:2023:ESR, author = "Jiandian Zeng and Jiantao Zhou and Caishi Huang", title = "Exploring Semantic Relations for Social Media Sentiment Analysis", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2382--2394", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3285238", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3285238", abstract = "With the massive social media data available online, the conventional single modality emotion classification has developed into more complex models of multimodal sentiment analysis. 
Most existing works simply extracted image features at a coarse level, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Drakopoulos:2023:NNF, author = "Fotios Drakopoulos and Sarah Verhulst", title = "A Neural-Network Framework for the Design of Individualised Hearing-Loss Compensation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2395--2409", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3282093", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3282093", abstract = "Sound processing in the human auditory system is complex and highly non-linear, whereas hearing aids (HAs) still rely on simplified descriptions of auditory processing or hearing loss to restore hearing. 
Even though standard HA amplification strategies \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ma:2023:ESA, author = "Xinbei Ma and Zhuosheng Zhang and Hai Zhao", title = "Enhanced Speaker-Aware Multi-Party Multi-Turn Dialogue Comprehension", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2410--2423", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3284516", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3284516", abstract = "Multi-party multi-turn dialogue comprehension brings unprecedented challenges in handling complicated scenarios, as the co-occurrence of multiple speakers causes complexity and inconsistency. As a result of the multiple participation, the shift of speaker \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2023:HAM, author = "Tianrui Wang and Weibin Zhu and Yingying Gao and Shilei Zhang and Junlan Feng", title = "Harmonic Attention for Monaural Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2424--2436", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3284522", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3284522", abstract = "To further improve the quality of the enhanced speech, it is appealing that more profound articulatory and auditory knowledge should be introduced into the speech enhancement model.
Among these, harmonics seriously affect speech timbre and play a crucial \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lei:2023:MCK, author = "Lei Lei and Guoshun Yuan and Hongjiang Yu and Dewei Kong and Yuefeng He", title = "Multilingual Customized Keyword Spotting Using Similar-Pair Contrastive Learning", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2437--2447", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3284523", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3284523", abstract = "The goal of keyword spotting (KWS) is to find words and voice commands. KWS research has received a lot of attention recently. However, the majority of them emphasize predefined KWS. 
More often than not, customers wish to choose individualized unique \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:MSD, author = "Shaokai Li and Peng Song and Wenming Zheng", title = "Multi-Source Discriminant Subspace Alignment for Cross-Domain Speech Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2448--2460", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3288415", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3288415", abstract = "Cross-domain speech emotion recognition (SER) is an effective strategy to improve the generalization ability of emotion classification models, which is an important research direction in speech signal processing. However, since the speech signals are non-.
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ren:2023:GVS, author = "Yeqing Ren and Haipeng Peng and Lixiang Li and Xiaopeng Xue and Yang Lan and Yixian Yang", title = "Generalized Voice Spoofing Detection via Integral Knowledge Amalgamation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2461--2475", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3288416", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3288416", abstract = "Most of the voice spoofing detection methods are designed for specific kinds of spoofing attacks, synthetic or replay. In practice, however, there is no prior information about these two kinds of spoofing attacks. 
To this end, this paper proposes a \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2023:LLM, author = "Xing Chen and Jie Wang and Xiao-Lei Zhang and Wei-Qiang Zhang and Kunde Yang", title = "{LMD}: a Learnable Mask Network to Detect Adversarial Examples for Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2476--2490", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3288417", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3288417", abstract = "Although the security of automatic speaker verification (ASV) is seriously threatened by recently emerged adversarial attacks, there have been some countermeasures to alleviate the threat. 
However, many defense approaches not only require the prior \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yen:2023:RNA, author = "Benjamin Yen and Yameizhen Li and Yusuke Hioka", title = "Rotor Noise-Aware Noise Covariance Matrix Estimation for Unmanned Aerial Vehicle Audition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2491--2506", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3288410", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3288410", abstract = "A noise covariance matrix (NCM) estimation method for unmanned aerial vehicle (UAV) audition is proposed with rotor noise reduction as its primary focus. The proposed NCM estimation method could be incorporated into audio processing algorithms using UAV-. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:ATS, author = "Xuechen Liu and Xin Wang and Md Sahidullah and Jose Patino and H{\'e}ctor Delgado and Tomi Kinnunen and Massimiliano Todisco and Junichi Yamagishi and Nicholas Evans and Andreas Nautsch and Kong Aik Lee", title = "{ASVspoof 2021}: Towards Spoofed and Deepfake Speech Detection in the Wild", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2507--2522", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3285283", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3285283", abstract = "Benchmarking initiatives support the meaningful comparison of competing solutions to prominent problems in speech and language processing. 
Successive benchmarking evaluations typically reflect a progressive evolution from ideal lab conditions towards to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Borsos:2023:ALM, author = "Zal{\'a}n Borsos and Rapha{\"e}l Marinier and Damien Vincent and Eugene Kharitonov and Olivier Pietquin and Matt Sharifi and Dominik Roblek and Olivier Teboul and David Grangier and Marco Tagliasacchi and Neil Zeghidour", title = "{AudioLM}: a Language Modeling Approach to Audio Generation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2523--2533", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3288409", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3288409", abstract = "We introduce AudioLM, a framework for high-quality audio generation with long-term consistency. AudioLM maps the input audio to a sequence of discrete tokens and casts audio generation as a language modeling task in this representation space. 
We show how \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:MTI, author = "Xingfeng Li and Xiaohan Shi and Desheng Hu and Yongwei Li and Qingchen Zhang and Zhengxia Wang and Masashi Unoki and Masato Akagi", title = "Music Theory-Inspired Acoustic Representation for Speech Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2534--2547", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3289312", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3289312", abstract = "This research presents a music theory-inspired acoustic representation (hereafter, MTAR) to address improved speech emotion recognition. The recognition of emotion in speech and music is developed in parallel, yet a relatively limited understanding of \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lian:2023:UTA, author = "Jiachen Lian and Chunlei Zhang and Gopala K. 
Anumanchipalli and Dong Yu", title = "Unsupervised {TTS} Acoustic Modeling for {TTS} With Conditional Disentangled Sequential {VAE}", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2548--2557", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3290423", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3290423", abstract = "In this paper, we propose a novel unsupervised text-to-speech acoustic model training scheme, named UTTS, which does not require text-audio pairs. UTTS is a multi-speaker speech synthesizer that supports zero-shot voice cloning, it is developed from a \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Malik:2023:PLD, author = "Arsalan Malik and Nipun Agarwal and Harshavardhan Settibhaktini and Ananthakrishna Chintanpalli", title = "Predicting Level-Dependent Changes in Concurrent Vowel Scores Using the {$2$D-CNN} Models", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2558--2566", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3288411", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3288411", abstract = "Differences in fundamental frequencies (F0s) are an important cue for segregating multiple speakers. However, the ability to avail this cue for identification varies with sound levels. 
For different- and same-F0 conditions, the identification scores of \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Krause:2023:HCI, author = "Michael Krause and Meinard M{\"u}ller", title = "Hierarchical Classification for Instrument Activity Detection in Orchestral Music Recordings", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2567--2578", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3291506", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3291506", abstract = "Instrument activity detection is a fundamental task in music information retrieval, serving as a basis for many applications, such as music recommendation, music tagging, or remixing. 
Most published works on this task cover popular music and music for \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Meyer:2023:VHR, author = "Julie Meyer and Sebastian Prepeli{\c{t}}{\u{a}} and Ali Khajeh-Saeed and Michael Smirnov and Pablo Hoffmann", title = "Verification on Head-Related Transfer Functions of a Snowman Model Simulated Using the Finite-Difference Time-Domain Method", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2579--2591", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3291529", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3291529", abstract = "Although finite-difference time-domain (FDTD) simulations are extensively used in acoustics, studies assessing the reliability and the accuracy of the implemented method are scarce. Moreover, the operational validity of a simulation method is context-
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Petermann:2023:TCF, author = "Darius Petermann and Gordon Wichern and Aswin Shanmugam Subramanian and Zhong-Qiu Wang and Jonathan {Le Roux}", title = "Tackling the Cocktail Fork Problem for Separation and Transcription of Real-World Soundtracks", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2592--2605", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3290428", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3290428", abstract = "Emulating the human ability to solve the cocktail party problem, i.e., focus on a source of interest in a complex acoustic scene, is a long standing goal of audio source separation research. 
In this paper, we focus on the cocktail fork problem, which \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cao:2023:DWE, author = "Hailong Cao and Liguo Li and Conghui Zhu and Muyun Yang and Tiejun Zhao", title = "Dual Word Embedding for Robust Unsupervised Bilingual Lexicon Induction", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2606--2615", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3290425", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3290425", abstract = "The word embedding models such as Word2vec and FastText simultaneously learn dual representations of input vectors and output vectors. In contrast, almost all existing unsupervised bilingual lexicon induction (UBLI) methods use only input vectors without \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xiao:2023:TAP, author = "Lin Xiao and Pengyu Xu and Mingyang Song and Huafeng Liu and Liping Jing and Xiangliang Zhang", title = "Triple Alliance Prototype Orthotist Network for Long-Tailed Multi-Label Text Classification", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2616--2628", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3265860", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3265860", abstract = "Multi-label text classification (MLTC) aims to tag the most relevant labels for the 
given document. Compared to the standard multi-class case where each document has only one label, it is considerably more difficulty to annotate new coming documents for \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:UIK, author = "Juhua Liu and Qihuang Zhong and Liang Ding and Hua Jin and Bo Du and Dacheng Tao", title = "Unified Instance and Knowledge Alignment Pretraining for Aspect-Based Sentiment Analysis", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2629--2642", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3290431", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3290431", abstract = "The goal of aspect-based sentiment analysis (ABSA) is to determine the sentiment polarity towards an aspect. Because of the expensive and limited amounts of labelled data, the pretraining strategy has become the de facto standard for ABSA. 
However, there \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:AAC, author = "Yiming Zhang and Hong Yu and Ruoyi Du and Zheng-Hua Tan and Wenwu Wang and Zhanyu Ma and Yuan Dong", title = "{ACTUAL}: Audio Captioning With Caption Feature Space Regularization", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2643--2657", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3293015", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3293015", abstract = "Audio captioning aims at describing the content of audio clips with human language. Due to the ambiguity of audio content, different people may perceive the same audio clip differently, resulting in caption disparities \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Abesser:2023:HRA, author = "Jakob Abe{\ss}er and Sascha Grollmisch and Meinard M{\"u}ller", title = "How Robust are Audio Embeddings for Polyphonic Sound Event Tagging?", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2658--2667", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3293032", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3293032", abstract = "Sound classification algorithms are challenged by the natural variability of everyday sounds, particularly for large sound class taxonomies. 
In order to be applicable in real-life environments, such algorithms must also be able to handle polyphonic \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xia:2023:ADB, author = "Wei Xia and John H. L. Hansen", title = "Attention and {DCT} Based Global Context Modeling for Text-Independent Speaker Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2668--2679", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3284521", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3284521", abstract = "Learning an effective speaker representation is crucial for achieving reliable performance in speaker verification tasks. Speech signals are high-dimensional, long, and variable-length sequences containing diverse information at each time-frequency (TF) \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hasumi:2023:PIP, author = "Takuya Hasumi and Tomohiko Nakamura and Norihiro Takamune and Hiroshi Saruwatari and Daichi Kitamura and Yu Takahashi and Kazunobu Kondo", title = "{PoP-IDLMA}: Product-of-Prior Independent Deeply Learned Matrix Analysis for Multichannel Music Source Separation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2680--2694", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3293044", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3293044", abstract = 
"Independent deeply learned matrix analysis (IDLMA) is a state-of-the-art determined audio source separation method based on pretrained deep neural networks (DNNs). Owing to the excellent expression power of DNNs, IDLMA can handle a wider range of sources \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:CCB, author = "Ben Liu and Jun Wang and Guanyuan Yu and Shaolei Chen", title = "{CUPVC}: a Constraint-Based Unsupervised Prosody Transfer for Improving Telephone Banking Services", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2695--2706", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3293042", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3293042", abstract = "Low efficiency in telephone banking services reduces customer satisfaction. Therefore, some recent studies have concentrated on applying voice conversion models to improve telephone banking services. 
However, building such a model raises three huge \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:AVE, author = "Guinan Li and Jiajun Deng and Mengzhe Geng and Zengrui Jin and Tianzi Wang and Shujie Hu and Mingyu Cui and Helen Meng and Xunying Liu", title = "Audio-Visual End-to-End Multi-Channel Speech Separation, Dereverberation and Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2707--2723", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3294705", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3294705", abstract = "Accurate recognition of cocktail party speech containing overlapping speakers, noise and reverberation remains a highly challenging task to date. 
Motivated by the invariance of visual modality to acoustic signal corruption, an audio-visual multi-channel \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lemercier:2023:SDB, author = "Jean-Marie Lemercier and Julius Richter and Simon Welker and Timo Gerkmann", title = "{StoRM}: a Diffusion-Based Stochastic Regeneration Model for Speech Enhancement and Dereverberation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2724--2737", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3294692", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3294692", abstract = "Diffusion models have shown a great ability at bridging the performance gap between predictive and generative approaches for speech enhancement. 
We have shown that they may even outperform their predictive counterparts for non-additive corruption types or \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lu:2023:ISE, author = "Yen-Ju Lu and Chia-Yu Chang and Cheng Yu and Ching-Feng Liu and Jeih-weih Hung and Shinji Watanabe and Yu Tsao", title = "Improving Speech Enhancement Performance by Leveraging Contextual Broad Phonetic Class Information", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2738--2750", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3288418", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3288418", abstract = "Previous studies have confirmed that by augmenting acoustic features with the place/manner of articulatory features, the speech enhancement (SE) process can be guided to consider the broad phonetic properties of the input speech when performing \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kim:2023:MSM, author = "Sungjae Kim and Yewon Kim and Jewoo Jun and Injung Kim", title = "{MuSE-SVS}: Multi-Singer Emotional Singing Voice Synthesizer That Controls Emotional Intensity", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2751--2764", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3294712", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3294712", abstract = "We propose a 
multi-singer emotional singing voice synthesizer, Muse-SVS, that expresses emotion at various intensity levels by controlling subtle changes in pitch, energy, and phoneme duration while accurately following the score. To control multiple \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Su:2023:RTD, author = "Xinxin Su and Zhen Huang and Yunxiang Zhao and Yifan Chen and Yong Dou and Hengyue Pan", title = "Recent Trends in Deep Learning Based Textual Emotion Cause Extraction", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2765--2786", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3254166", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3254166", abstract = "Emotion Cause Extraction Field (ECEF) focuses on the cause that triggers an emotion in a document. 
Traditional ECEF aims to extract the cause based on a given emotion while recent ECEF focuses more on extracting both the emotion and its corresponding \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lu:2023:HSD, author = "Junyu Lu and Hongfei Lin and Xiaokun Zhang and Zhaoqing Li and Tongyue Zhang and Linlin Zong and Fenglong Ma and Bo Xu", title = "Hate Speech Detection via Dual Contrastive Learning", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2787--2795", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3294715", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3294715", abstract = "The fast spread of hate speech on social media impacts the Internet environment and our society by increasing prejudice and hurting people. Detecting hate speech has aroused broad attention in the field of natural language processing. Although hate speech \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{doCarmo:2023:CFS, author = "Diego Marques do Carmo and Ricardo A. 
Borsoi and M{\'a}rcio Holsbach Costa", title = "Closed-Form Solution to the Multichannel {Wiener} Filter With Interaural Level Difference Preservation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2796--2811", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3291530", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3291530", abstract = "This article presents a multichannel Wiener filter (MWF) based noise reduction method with preservation of the interaural level difference (ILD). It minimizes the MWF cost function subject to two constraints for ILD preservation. Under this approach, the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:PMP, author = "Ya-Jie Zhang and Chao Zhang and Wei Song and Zhengchen Zhang and Youzheng Wu and Xiaodong He", title = "Prosody Modelling With Pre-Trained Cross-Utterance Representations for Improved Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2812--2823", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3278184", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3278184", abstract = "When humans speak multiple utterances in a continuous manner, the prosodic features generated in each utterance are related to those in its neighbouring utterances. Such cross-utterance (CU) dependencies are often ignored by the current neural text-to-
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chiu:2023:LPB, author = "Ching-Yu Chiu and Meinard M{\"u}ller and Matthew E. P. Davies and Alvin Wen-Yu Su and Yi-Hsuan Yang", title = "Local Periodicity-Based Beat Tracking for Expressive Classical Piano Music", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2824--2835", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3297956", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3297956", abstract = "To model the periodicity of beats, state-of-the-art beat tracking systems use ``post-processing trackers'' (PPTs) that rely on several empirically determined global assumptions for tempo transition, which work well for music with a steady \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2023:NMD, author = "Feng Chen and Ke Ma and Yapeng Mao and Desen Yang and Yi Zhang and Jie Shi and Shiqi Mo and Gui Chenyang and Song Li", title = "A Novel Method to Design Steerable Differential Beamformer Using Linear Acoustics Vector Sensor Array", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2836--2849", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3297960", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3297960", abstract = "Differential beamforming techniques have gained significant attention due to their 
frequency-independent beampatterns, applicability for small apertures, and super-directivity. It is commonly known that the main lobe of a beam pattern based on a linear \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Huang:2023:UDK, author = "Tianyu Huang and Weisheng Dong and Fangfang Wu and Xin Li and Guangming Shi", title = "Uncertainty-Driven Knowledge Distillation for Language Model Compression", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2850--2858", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3289303", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3289303", abstract = "Despite the remarkable performance on various Natural Language Processing (NLP) tasks, the parametric complexity of pretrained language models has remained a major obstacle due to limited computational resources in many practical applications. 
Techniques \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Carofilis:2023:IAC, author = "Andr{\'e}s Carofilis and Enrique Alegre and Eduardo Fidalgo and Laura Fern{\'a}ndez-Robles", title = "Improvement of Accent Classification Models Through Grad-Transfer From Spectrograms and Gradient-Weighted Class Activation Mapping", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2859--2871", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3297961", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3297961", abstract = "Automatic accent classification is an active research field concerning speech processing. It can be useful to identify a speaker's region of origin, which can be applied in police investigations carried out by Law Enforcement Agencies, as well as \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hollebon:2023:HOS, author = "Jacob Hollebon and Filippo Maria Fazi", title = "Higher-Order Stereophony", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2872--2885", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3297953", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3297953", abstract = "This work introduces a new theory for spatial audio recording and reproduction named Higher Order Stereophony. 
Through the use of the Taylor expansion, the technique accurately reproduces a sound field across a line that is orientated as the interaural \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wong:2023:MIR, author = "Jeremy H. M. Wong and Huayun Zhang and Nancy F. Chen", title = "Modelling Inter-Rater Uncertainty in Spoken Language Assessment", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2886--2898", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3297958", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3297958", abstract = "In a subjective task, such as Spoken Language Assessment (SLA), the reference scores provided by different human raters may vary. A collection of annotated scores from multiple raters can be interpreted as an expression of data uncertainty. 
Previous \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zheng:2023:EIC, author = "Qinghua Zheng and Yuefei Wu and Guangtao Wang and Yanping Chen and Wei Wu and Zai Zhang and Bin Shi and Bo Dong", title = "Exploring Interactive and Contrastive Relations for Nested Named Entity Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2899--2909", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3293047", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3293047", abstract = "Nested named entities (nested NEs) refer to the situation where one named entity is included or nested within another named entity, which cannot be recognized by the traditional sequence labeling methods. 
Recently, span-based methods have become the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shi:2023:TLC, author = "Dongyuan Shi and Woon-Seng Gan and Bhan Lam and Zhengding Luo and Xiaoyi Shen", title = "Transferable Latent of {CNN}-Based Selective Fixed-Filter Active Noise Control", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2910--2921", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3261757", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3261757", abstract = "Practical active noise control (ANC) systems, like the active noise cancellation headphone, usually adopt a control filter with preset coefficients to achieve satisfactory noise reduction performance for dynamic noise and higher robustness. In this \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Desblancs:2023:ZNS, author = "Dorian Desblancs and Vincent Lostanlen and Romain Hennequin", title = "Zero-Note Samba: Self-Supervised Beat Tracking", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2922--2934", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3297963", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3297963", abstract = "Supervised machine learning for music information retrieval requires a large annotated training set, and is thus an expensive and time-consuming process. 
To circumvent this problem, we propose to train deep neural networks to perceive beats in musical \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2023:CXC, author = "Nankai Lin and Yingwen Fu and Xiaotian Lin and Dong Zhou and Aimin Yang and Shengyi Jiang", title = "{CL-XABSA}: Contrastive Learning for Cross-Lingual Aspect-Based Sentiment Analysis", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2935--2946", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3297964", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3297964", abstract = "Aspect-based sentiment analysis (ABSA), an extensively researched area in the field of natural language processing (NLP), predicts the sentiment expressed in a text relative to the corresponding aspect. 
Unfortunately, most languages lack sufficient \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:LID, author = "Hanmeng Liu and Jian Liu and Leyang Cui and Zhiyang Teng and Nan Duan and Ming Zhou and Yue Zhang", title = "{LogiQA 2.0} --- an Improved Dataset for Logical Reasoning in Natural Language Understanding", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2947--2962", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3293046", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3293046", abstract = "NLP research on logical reasoning regains momentum with the recent releases of a handful of datasets, notably LogiQA and Reclor. Logical reasoning is exploited in many probing tasks over large Pre-trained Language Models (PLMs) and downstream tasks like \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yi:2023:AMT, author = "Jiangyan Yi and Jianhua Tao and Ruibo Fu and Tao Wang and Chu Yuan Zhang and Chenglong Wang", title = "Adversarial Multi-Task Learning for {Mandarin} Prosodic Boundary Prediction With Multi-Modal Embeddings", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2963--2973", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3301235", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3301235", abstract = "Prosodic boundaries are still crucial to the 
naturalness of end-to-end speech synthesis systems. This article proposes to use adversarial multi-task learning to predict prosodic boundaries. Adversarial multi-task learning is utilized to transfer knowledge \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yoon:2023:OTL, author = "Ji Won Yoon and Hyung Yong Kim and Hyeonseung Lee and Sunghwan Ahn and Nam Soo Kim", title = "Oracle Teacher: Leveraging Target Information for Better Knowledge Distillation of {CTC} Models", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2974--2987", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3297955", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3297955", abstract = "Knowledge distillation (KD), best known as an effective method for model compression, aims at transferring the knowledge of a bigger network (teacher) to a much smaller network (student). 
Conventional KD methods usually employ the teacher model trained in \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Duan:2023:SAD, author = "Sufeng Duan and Hai Zhao and Dongdong Zhang", title = "Syntax-Aware Data Augmentation for Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "2988--2999", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3301214", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3301214", abstract = "Data augmentation is an effective method for the performance enhancement of neural machine translation (NMT) by generating additional bilingual data. In this article, we propose a novel data augmentation strategy for neural machine translation. Unlike \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:HRM, author = "Tongzheng Liu and Zhihua Lu and Jo{\~a}o Paulo J. 
da Costa and Tai Fei", title = "A Hybrid Reverberation Model and Its Application to Joint Speech Dereverberation and Separation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3000--3014", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3301227", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3301227", abstract = "This article proposes a hybrid reverberation model by integrating two conventional models, namely, the multichannel linear prediction (MCLP) model and the spatial coherence model. The late reverberation is divided into two components. One component is \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Guo:2023:LLP, author = "Junjun Guo and Junjie Ye and Yan Xiang and Zhengtao Yu", title = "Layer-Level Progressive Transformer With Modality Difference Awareness for Multi-Modal Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3015--3026", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3301210", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3301210", abstract = "Multi-modal neural machine translation (MNMT) aims to translate sentences from the source language into the target language with the aid of corresponding images. 
Unfortunately, there is a considerable modality gap between the semantic-related images and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tao:2023:NUA, author = "Qian Tao and Zhihao Xiong and Bocheng Han and Xiaoyang Fan and Lusi Li", title = "A Novel Unsupervised Approach for Cross-Lingual Word Alignment in Low Isomorphic Embedding Spaces", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3027--3041", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3301208", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3301208", abstract = "Cross-lingual word alignment is the task for word translation between monolingual word embedding spaces of two different languages. 
Recent work is mostly based on supervised approaches, while their success relies on bilingual seed dictionaries derived \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jin:2023:DBG, author = "Jilu Jin and Jacob Benesty and Jingdong Chen and Gongping Huang", title = "Differential Beamforming From a Geometric Perspective", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3042--3054", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3301245", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3301245", abstract = "Differential microphone arrays (DMAs) have demonstrated a great potential for solving the high-fidelity sound acquisition problem in a wide range of applications as they possess many good properties such as frequency-independent beampatterns with high \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Palomo-Alonso:2023:FAU, author = "Alberto Palomo-Alonso and David Casillas-P{\'e}rez and Silvia Jim{\'e}nez-Fern{\'a}ndez and Jose A. 
Portilla-Figueras and Sancho Salcedo-Sanz", title = "A Flexible Architecture Using Temporal, Spatial and Semantic Correlation-Based Algorithms for Story Segmentation of Broadcast News", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3055--3069", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3301231", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3301231", abstract = "In this article, we propose a novel flexible architecture, with different algorithmic procedures, for effective story segmentation of broadcast news from subtitle files. The proposed system exploits spatial and temporal distance, as well as sentence \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yusuf:2023:EEO, author = "Bolaji Yusuf and Jan {\v{C}}ernock{\'y} and Murat Sara{\c{c}}lar", title = "End-to-End Open Vocabulary Keyword Search With Multilingual Neural Representations", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3070--3080", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3301239", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3301239", abstract = "Conventional keyword search systems operate on automatic speech recognition (ASR) outputs, which causes them to have a complex indexing and search pipeline. This has led to interest in ASR-free approaches to simplify the search procedure. 
We recently \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Herzog:2023:AJA, author = "Adrian Herzog and Srikanth Raj Chetupalli and Emanu{\"e}l A. P. Habets", title = "{AmbiSep}: Joint Ambisonic-to-Ambisonic Speech Separation and Noise Reduction", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3081--3094", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3297954", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3297954", abstract = "Blind separation of the sounds in an Ambisonic sound scene is a challenging problem, especially when the spatial impression of these sounds needs to be preserved. In this work, we consider Ambisonic-to-Ambisonic separation of reverberant speech mixtures, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hsu:2023:PSA, author = "Po-chun Hsu and Da-rong Liu and Andy T. Liu and Hung-yi Lee", title = "Parallel Synthesis for Autoregressive Speech Generation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3095--3111", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3301212", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3301212", abstract = "Autoregressive neural vocoders have achieved outstanding performance in speech synthesis tasks such as text-to-speech and voice conversion. 
An autoregressive vocoder predicts a sample at some time step conditioned on those at previous time steps. Though \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Dalmia:2023:LBM, author = "Siddharth Dalmia and Dmytro Okhonko and Mike Lewis and Sergey Edunov and Shinji Watanabe and Florian Metze and Luke Zettlemoyer and Abdelrahman Mohamed", title = "{LegoNN}: Building Modular Encoder-Decoder Models", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3112--3126", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3296019", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3296019", abstract = "State-of-the-art encoder-decoder models (e.g. for machine translation (MT) or automatic speech recognition (ASR)) are constructed and trained end-to-end as an atomic unit. 
No component of the model can be (re-)used without the others, making it impossible \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gajecki:2023:DLF, author = "Tom Gajecki and Waldo Nogueira", title = "Deep Latent Fusion Layers for Binaural Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3127--3138", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3301223", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3301223", abstract = "This work addresses the issue of enhancing speech in binaural hearing scenarios. Specifically, we present a method to improve binaural noise reduction by integrating latent features produced by monaural speech enhancement algorithms through the use of \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Feng:2023:PBS, author = "Huawen Feng and Zhenxi Lin and Qianli Ma", title = "Perturbation-Based Self-Supervised Attention for Attention Bias in Text Classification", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3139--3151", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3302230", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3302230", abstract = "In text classification, the traditional attention mechanisms usually focus too much on frequent words, and need extensive labeled data in order to learn. 
This article proposes a perturbation-based self-supervised attention approach to guide attention \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhong:2023:SSS, author = "Jiaxin Zhong and Tao Zhuang and Mengtong Li and Ray Kirby and Mahmoud Karimi and Jing Lu and Dong Zhang", title = "Sidelobe Suppression for a Steerable Parametric Source Using the Sparse Random Array Technique", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3152--3161", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3304491", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3304491", abstract = "A steerable parametric source is designed to steer an audio beam without mechanically rotating the source. 
To achieve this without the generation of grating lobes requires an ultrasonic array with interelement spacing that is less than half the wavelength \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fang:2023:CCS, author = "Yan Fang and Wei Lu and Xiaodong Liu and Witold Pedrycz and Qi Lang and Jianhua Yang", title = "{CircularE}: a Complex Space Circular Correlation Relational Model for Link Prediction in Knowledge Graph Embedding", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3162--3175", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3297959", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3297959", abstract = "Knowledge graphs are regarded as structured knowledge bases that embody various facts coming from the real world. Their completeness is still far from satisfactory. 
Relational learning models in link prediction can automatically find the missing \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:SSS, author = "Jie Zhang and Rui Tao and Jun Du and Li-Rong Dai", title = "{SDW-SWF}: Speech Distortion Weighted Single-Channel {Wiener} Filter for Noise Reduction", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3176--3189", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3304474", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3304474", abstract = "Speech enhancement shows an important necessity in many audio applications, particularly in noisy environments, where the speech quality needs to be improved. 
In this work, we consider the single-channel noise reduction (NR) problem from the conventional \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:AFN, author = "Haozhou Li and Qinke Peng and Xu Mou and Ying Wang and Zeyuan Zeng and Muhammad Fiaz Bashir", title = "Abstractive Financial News Summarization via Transformer-{BiLSTM} Encoder and Graph Attention-Based Decoder", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3190--3205", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3304473", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3304473", abstract = "Financial news summarization (FNS) has been an attractive research problem in recent years, which aims to generate a shorter highlight of the news article while preserving key factual aspects, emotions, and opinions, providing significant assistance in \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yuan:2023:UDU, author = "Weitao Yuan and Shengbei Wang and Jianming Wang and Masashi Unoki and Wenwu Wang", title = "Unsupervised Deep Unfolded Representation Learning for Singing Voice Separation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3206--3220", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3302237", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3302237", abstract = "Learning effective vocal 
representations from a waveform mixture is a crucial but challenging task for deep neural network (DNN)-based singing voice separation (SVS). Successful representation learning (RL) depends heavily on well-designed neural \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2023:TGI, author = "Zhong-Qiu Wang and Samuele Cornell and Shukjae Choi and Younglo Lee and Byeong-Yeol Kim and Shinji Watanabe", title = "{TF-GridNet}: Integrating Full- and Sub-Band Modeling for Speech Separation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3221--3236", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3304482", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3304482", abstract = "We propose TF-GridNet for speech separation. The model is a novel deep neural network (DNN) integrating full- and sub-band modeling in the time-frequency (T-F) domain. It stacks several blocks, each consisting of an intra-frame full-band module, a sub-band 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tammen:2023:PEP, author = "Marvin Tammen and Simon Doclo", title = "Parameter Estimation Procedures for Deep Multi-Frame {MVDR} Filtering for Single-Microphone Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3237--3248", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3306715", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3306715", abstract = "Aiming at exploiting temporal correlations across consecutive time frames in the short-time Fourier transform (STFT) domain, multi-frame algorithms for single-microphone speech enhancement have been proposed. Typically, the multi-frame filter coefficients \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2023:TRR, author = "Yi Lin and Qingyang Wang and Xincheng Yu and Zichen Zhang and Dongyue Guo and Jizhe Zhou", title = "Towards Recognition for Radio-Echo Speech in Air Traffic Control: Dataset and a Contrastive Learning Approach", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3249--3262", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3307219", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3307219", abstract = "In the air traffic control (ATC) domain, automatic speech recognition (ASR) suffers from radio speech echo, which cannot be addressed by 
existing echo cancellation due to auditory-oriented optimization and poor generalization ability caused by volatile \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Caviedes-Nozal:2023:STB, author = "Diego Caviedes-Nozal and Efren Fernandez-Grande", title = "Spatio-Temporal {Bayesian} Regression for Room Impulse Response Reconstruction With Spherical Waves", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3263--3277", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3306708", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3306708", abstract = "The reconstruction of sound fields in a room from a limited set of measurements is a central problem in acoustics, with relevant applications in e.g. acoustic analysis, audio, or sound field control. 
Conventional approaches rely on measuring the room \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hu:2023:RDP, author = "Xinyu Hu and Xiaojun Wan", title = "{RST} Discourse Parsing as Text-to-Text Generation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3278--3289", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3306710", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3306710", abstract = "Previous studies have made great advances in RST discourse parsing through specific neural frameworks or features, but they usually split the parsing process into two subtasks and heavily depended on gold discourse segmentation. In this article, we \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lei:2023:MMS, author = "Shun Lei and Yixuan Zhou and Liyang Chen and Zhiyong Wu and Xixin Wu and Shiyin Kang and Helen Meng", title = "{MSStyleTTS}: Multi-Scale Style Modeling With Hierarchical Context Information for Expressive Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3290--3303", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3301217", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3301217", abstract = "Expressive speech synthesis is crucial for many human-computer interaction scenarios, such as audiobooks, podcasts, and voice assistants. 
Previous works focus on predicting the style embeddings at one single scale from the information within the current \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lehmann:2023:TMP, author = "Pedro Izquierdo Lehmann and Rodrigo F. C{\'a}diz and Carlos A. Sing Long", title = "Towards Maximizing a Perceptual {{\em Sweet Spot\/}} for Spatial Sound With Loudspeakers", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3304--3319", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2022.3190729", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2022.3190729", abstract = "The {\em sweet spot\/} can be interpreted as the region where acoustic sources create a spatial auditory illusion. We study the problem of maximizing this sweet spot when reproducing a desired sound wave using an array of loudspeakers. 
To achieve \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhu:2023:APL, author = "Han Zhu and Dongji Gao and Gaofeng Cheng and Daniel Povey and Pengyuan Zhang and Yonghong Yan", title = "Alternative Pseudo-Labeling for Semi-Supervised Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3320--3330", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3306709", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3306709", abstract = "When labeled data is insufficient, pseudo-labeling based semi-supervised learning can significantly improve the performance of automatic speech recognition. However, pseudo-labels are often noisy, containing numerous incorrect tokens. 
Taking noisy labels \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:CBS, author = "Junqing Zhang and Liming Shi and Mads Gr{\ae}sb{\o}ll Christensen and Wen Zhang and Lijun Zhang and Jingdong Chen", title = "{CGMM}-Based Sound Zone Generation Using Robust Pressure Matching With {ATF} Perturbation Constraints", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3331--3345", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3306712", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3306712", abstract = "Personal sound zone (PSZ) refers to the technique that uses an array of loudspeakers and digital signal processing tools to achieve spatial soundfield control. 
To generate the target sound zones, this technique generally requires to know the acoustic \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Loweimi:2023:PEA, author = "Erfan Loweimi and Andrea Carmantini and Peter Bell and Steve Renals and Zoran Cvetkovic", title = "Phonetic Error Analysis Beyond Phone Error Rate", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3346--3361", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313417", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313417", abstract = "In this article, we analyse the performance of the TIMIT-based phone recognition systems beyond the overall phone error rate (PER) metric. We consider three broad phonetic classes (BPCs): affricate, diphthong, fricative, nasal, plosive, semi-vowel, vowel, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yang:2023:FHF, author = "Runxuan Yang and Yuyang Peng and Xiaolin Hu", title = "A Fast High-Fidelity Source-Filter Vocoder With Lightweight Neural Modules", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3362--3373", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3321191", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3321191", abstract = "The quality of raw audio waveform generated by a vocoder could affect various audio generative tasks. 
In recent years, the dominance of source-filter vocoders was greatly challenged by neural vocoders as the latter presents far superior synthesized audio \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:ISSa, author = "Yuxiang Zhang and Zhuo Li and Jingze Lu and Hua Hua and Wenchao Wang and Pengyuan Zhang", title = "The Impact of Silence on Speech Anti-Spoofing", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3374--3389", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3306711", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3306711", abstract = "The current speech anti-spoofing countermeasures (CMs) show excellent performance on specific datasets. However, removing the silence of test speech through Voice Activity Detection (VAD) can severely degrade performance. 
In this article, the impact of \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gonzalez:2023:AGG, author = "Philippe Gonzalez and Tommy Sonne Alstr{\o}m and Tobias May", title = "Assessing the Generalization Gap of Learning-Based Speech Enhancement Systems in Noisy and Reverberant Environments", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3390--3403", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3318965", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3318965", abstract = "The acoustic variability of noisy and reverberant speech mixtures is influenced by multiple factors, such as the spectro-temporal characteristics of the target speaker and the interfering noise, the signal-to-noise ratio (SNR) and the room \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2023:CSQ, author = "Ziyi Xu and Ziyue Zhao and Tim Fingscheidt", title = "Coded Speech Quality Measurement by a Non-Intrusive {PESQ-DNN}", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3404--3417", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3317574", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3317574", abstract = "Wideband codecs such as AMR-WB or EVS are widely used in (mobile) speech communication. 
Evaluation of coded speech quality is often performed subjectively by an absolute category rating (ACR) listening test. However, the ACR test is impractical for online \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:DTD, author = "Tao Li and Chenxu Hu and Jian Cong and Xinfa Zhu and Jingbei Li and Qiao Tian and Yuping Wang and Lei Xie", title = "{DiCLET-TTS}: Diffusion Model Based Cross-Lingual Emotion Transfer for Text-to-Speech --- a Study Between {English} and {Mandarin}", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3418--3430", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313413", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313413", abstract = "While the performance of cross-lingual TTS based on monolingual corpora has been significantly improved recently, generating cross-lingual speech still suffers from the foreign accent problem, leading to limited naturalness. Besides, current cross-lingual \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2023:VCM, author = "Xuexin Xu and Liang Shi and Xunquan Chen and Pingyuan Lin and Jie Lian and Jinhui Chen and Zhihong Zhang and Edwin R. 
Hancock", title = "Any-to-Any Voice Conversion With Multi-Layer Speaker Adaptation and Content Supervision", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3431--3445", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3306716", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3306716", abstract = "Any-to-any voice conversion can be performed among arbitrary speakers, even with a single reference utterance. Many related studies have demonstrated that it can be effectively implemented by speech representation disentanglement. However, most existing \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Du:2023:SAT, author = "Chenpeng Du and Yiwei Guo and Xie Chen and Kai Yu", title = "Speaker Adaptive Text-to-Speech With Timbre-Normalized Vector-Quantized Feature", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3446--3456", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3308374", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3308374", abstract = "Achieving high fidelity and speaker similarity in text-to-speech speaker adaptation with limited amount of data is a challenging task.
Most existing methods only consider adapting to the timbre of the target speakers but fail to capture their speaking \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Atri:2023:MDS, author = "Yash Kumar Atri and Vikram Goyal and Tanmoy Chakraborty", title = "Multi-Document Summarization Using Selective Attention Span and Reinforcement Learning", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3457--3467", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3316459", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3316459", abstract = "Abstractive text summarization systems using recently improved RNN-based sequence-to-sequence architecture have shown great promise for single-document summarization. 
However, such neural models fail to perpetuate the performance in the multi-document \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Huang:2023:CBA, author = "Maochun Huang and Chunmei Qing and Junpeng Tan and Xiangmin Xu", title = "Context-Based Adaptive Multimodal Fusion Network for Continuous Frame-Level Sentiment Prediction", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3468--3477", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3321971", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3321971", abstract = "Recently, video sentiment computing has become the focus of research because of its benefits in many applications such as digital marketing, education, healthcare, and so on. The difficulty of video sentiment prediction mainly lies in the regression \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Schlecht:2023:DFD, author = "Sebastian J. Schlecht and Jon Fagerstr{\"o}m and Vesa V{\"a}lim{\"a}ki", title = "Decorrelation in Feedback Delay Networks", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3478--3487", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313440", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313440", abstract = "The feedback delay network (FDN) is a popular filter structure to generate artificial spatial reverberation. 
A common requirement for multichannel late reverberation is that the output signals are well decorrelated, as too high a correlation can lead to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lu:2023:TUM, author = "Jinliang Lu and Jiajun Zhang", title = "Towards Unified Multi-Domain Machine Translation With Mixture of Domain Experts", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3488--3498", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3316451", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3316451", abstract = "Multi-domain machine translation (MDMT) aims to construct models with mixed-domain training corpora to switch translation between different domains.
Previous studies either assume that the domain information is given and leverage the domain knowledge to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hauret:2023:CEE, author = "Julien Hauret and Thomas Joubaud and V{\'e}ronique Zimpfer and {\'E}ric Bavu", title = "Configurable {EBEN}: Extreme Bandwidth Extension Network to Enhance Body-Conducted Speech Capture", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3499--3512", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313433", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313433", abstract = "This article presents a configurable version of Extreme Bandwidth Extension Network (EBEN), a Generative Adversarial Network (GAN) designed to improve audio captured with body-conduction microphones. 
We show that although these microphones significantly \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Peng:2023:TSB, author = "Wanli Peng and Sheng Li and Zhenxing Qian and Xinpeng Zhang", title = "Text Steganalysis Based on Hierarchical Supervised Learning and Dual Attention Mechanism", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3513--3526", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3319975", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3319975", abstract = "Recent methods with deep neural networks for text steganalysis have succeeded in mining various feature representations. However, a limited number of studies have explicitly analyzed potential security issues of generative text steganography. 
Furthermore, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2023:ICI, author = "Lin Xu and Qixian Zhou and Jinlan Fu and See-Kiong Ng", title = "{CET2}: Modelling Topic Transitions for Coherent and Engaging Knowledge-Grounded Conversations", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3527--3536", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313418", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313418", abstract = "Knowledge-grounded dialogue systems aim to generate coherent and engaging responses based on the dialogue contexts and selected external knowledge. Previous knowledge selection methods tend to rely too heavily on the dialogue contexts or over-emphasize \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Neo:2023:SCU, author = "Vincent W. Neo and Christine Evers and Stephan Weiss and Patrick A. Naylor", title = "Signal Compaction Using Polynomial {EVD} for Spherical Array Processing With Applications", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3537--3549", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313441", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313441", abstract = "Multi-channel signals captured by spatially separated sensors often contain a high level of data redundancy.
A compact signal representation enables more efficient storage and processing, which has been exploited for data compression, noise reduction, and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Enzner:2023:HFR, author = "Gerald Enzner and Svantje Voit", title = "Hybrid-Frequency-Resolution Adaptive {Kalman} Filter for Online Identification of Long Acoustic Responses With Low Input-Output Latency", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3550--3563", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313435", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313435", abstract = "Online acoustic system identification is one of the most challenging tasks for adaptive filters.
Along with the desired accuracy in applications such as acoustic echo cancellation, it bears requirements of accommodating high-order systems \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gao:2023:MSL, author = "Shang Gao and Maoshen Jia and Dingding Yao and Jing Wang", title = "Multi-Source Localization Using Optimized Time-Frequency Representation and Sparsity Component Analysis", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3564--3578", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3316450", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3316450", abstract = "This article aims to address the multi-source localization problem by exploiting the sparsity of the speech signal in the time-frequency domain, where the challenge mainly lies in extracting the sparse component. 
An optimized time-frequency representation \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{He:2023:DMA, author = "Qi He and Mingjie Gao and Ka Fai Cedric Yiu and Sven Nordholm", title = "Distributed Microphone Array Localization Problem via {SDP-SOCP} Method", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3579--3588", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313437", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313437", abstract = "In multimedia applications, it is common to employ acoustic sensors collectively to enhance signals and to locate sound sources. A direct problem can be formulated to locate sound sources from a set of known sensors. 
In order to form the acoustic sensor \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sawada:2023:MFF, author = "Hiroshi Sawada and Rintaro Ikeshita and Keisuke Kinoshita and Tomohiro Nakatani", title = "Multi-Frame Full-Rank Spatial Covariance Analysis for Underdetermined Blind Source Separation and Dereverberation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3589--3602", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313446", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313446", abstract = "Full-rank spatial covariance analysis (FCA) is a technique for blind source separation (BSS), and can be applied to underdetermined situations where the sources outnumber the microphones.
This paper proposes multi-frame FCA as an extension of FCA to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chang:2023:JBJ, author = "Hongyang Chang and Hongfei Xu and Josef van Genabith and Deyi Xiong and Hongying Zan", title = "{JoinER-BART}: Joint Entity and Relation Extraction With Constrained Decoding, Representation Reuse and Fusion", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3603--3616", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3310879", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3310879", abstract = "Joint Entity and Relation Extraction (JERE) is an important research direction in Information Extraction (IE). 
Given the surprising performance with fine-tuning of pre-trained BERT in a wide range of NLP tasks, nowadays most studies for JERE are based on \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Huang:2023:SSA, author = "Xinqi Huang and Yingsong Li and Yuriy Zakharov and Yongchun Miao and Zhixiang Huang", title = "Squared Sine Adaptive Algorithm and Its Performance Analysis", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3617--3628", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313408", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313408", abstract = "The squared sine adaptive (SSA) algorithm is presented for identification scenarios, such as acoustic-echo cancellation (AEC) applications, in non-Gaussian environments. 
To devise the SSA algorithm, a novel cost function is constructed by exerting a \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:GUS, author = "Andong Li and Guochen Yu and Chengshi Zheng and Wenzhe Liu and Xiaodong Li", title = "A General Unfolding Speech Enhancement Method Motivated by {Taylor}'s Theorem", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3629--3646", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313442", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313442", abstract = "While deep neural networks have facilitated significant advancements in the field of speech enhancement, most existing methods are developed following either empirical or relatively blind criteria, lacking adequate guidelines in pipeline design. 
Inspired \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gu:2023:DCF, author = "Bin Gu and Jie Zhang and Wu Guo", title = "A Dynamic Convolution Framework for Session-Independent Speaker Embedding Learning", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3647--3658", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313431", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313431", abstract = "Speaker verification (SV) has suffered from session variability in complex acoustic scenarios, and learning session independent speaker representations remains a challenging problem. To tackle this, we propose a dynamic convolution framework for SV in \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zeng:2023:DLR, author = "Daojian Zeng and Chao Zhao and Chao Jiang and Jianling Zhu and Jianhua Dai", title = "Document-Level Relation Extraction With Context Guided Mention Integration and Inter-Pair Reasoning", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3659--3666", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3316454", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3316454", abstract = "Document-level Relation Extraction (DRE) aims to recognize the relations between two entities. The entity may correspond to multiple mentions that span beyond the sentence boundary.
Few previous studies have investigated the mention integration, which may \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:MSS, author = "Lu Li and Maoshen Jia and Jing Wang and Ruiyuan Cao", title = "Multiple-Speech-Source {DOA} Estimation Based on Single-Source Cluster Detection", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3667--3680", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3321213", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3321213", abstract = "This study proposes multiple-speech-source direction-of-arrival (DOA) estimation based on the distribution characteristic of the time-frequency (TF) point dominated by a single-source component (i.e., single-source point, SSP). By exploring the TF \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Miao:2023:SAU, author = "Xiaoxiao Miao and Xin Wang and Erica Cooper and Junichi Yamagishi and Natalia Tomashenko", title = "Speaker Anonymization Using Orthogonal {Householder} Neural Network", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3681--3695", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313429", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313429", abstract = "Speaker anonymization aims to conceal a speaker's identity while preserving content information in speech.
Current mainstream neural-network speaker anonymization systems disentangle speech into prosody-related, content, and speaker \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xue:2023:DLF, author = "Zhengshan Xue and Xiaolei Zhang and Tingxun Shi and Deyi Xiong", title = "{DetTrans}: a Lightweight Framework to Detect and Translate Noisy Inputs Simultaneously", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3696--3705", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3284513", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3284513", abstract = "Neural machine translation (NMT) systems trained on clean data usually suffer from performance degradation when translating noisy inputs. 
Existing works attempt to improve the robustness of NMT normally via data augmentation, where synthetic noisy data \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2023:PDF, author = "Chang Liu and Zhen-Hua Ling and Ling-Hui Chen", title = "Pronunciation Dictionary-Free Multilingual Speech Synthesis Using Learned Phonetic Representations", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3706--3716", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313424", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313424", abstract = "This article presents a multilingual speech synthesis approach that leverages learned phonetic representations to eliminate the need for pronunciation dictionaries in target languages. 
The learned phonetic representations consist of unsupervised phonetic \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yoneyama:2023:HFP, author = "Reo Yoneyama and Yi-Chiao Wu and Tomoki Toda", title = "High-Fidelity and Pitch-Controllable Neural Vocoder Based on Unified Source-Filter Networks", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3717--3729", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313410", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313410", abstract = "We introduce unified source-filter generative adversarial networks (uSFGAN), a waveform generative model conditioned on acoustic features, which represents the source-filter architecture in a generator network. Unlike the previous neural-based source-
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Thaleiser:2023:BPM, author = "Stefan Thaleiser and Gerald Enzner", title = "Binaural-Projection Multichannel {Wiener} Filter for Cue-Preserving Binaural Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3730--3745", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3317569", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3317569", abstract = "Former research in binaural speech enhancement has demonstrated a demand of binaural cue preservation beyond the requirements of noise suppression and speech quality. The binaural state-of-the-art is frequently grouped into the class of spatio-temporal \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2023:DAD, author = "Yixin Wang and Wei Wei and Xiangming Gu and Xiaohong Guan and Ye Wang", title = "Disentangled Adversarial Domain Adaptation for Phonation Mode Detection in Singing and Speech", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3746--3759", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3317568", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3317568", abstract = "Phonation mode detection predicts phonation modes and their temporal boundaries in singing and speech, holding promise for characterizing voice quality and vocal health. 
However, it is very challenging due to the domain disparities between training data \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2023:IFT, author = "Yixuan Zhang and Heming Wang and DeLiang Wang", title = "{$ F0 $} Estimation and Voicing Detection With Cascade Architecture in Noisy Speech", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3760--3770", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313427", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313427", abstract = "As a fundamental problem in speech processing, pitch tracking has been studied for decades. While strong performance has been achieved on clean speech, pitch tracking in noisy speech is still challenging. 
Severe non-stationary noises not only corrupt the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2023:TTB, author = "Zhengdao Zhao and Yuhua Wang and Guang Shen and Yuezhu Xu and Jiayuan Zhang", title = "{TDFNet}: Transformer-Based Deep-Scale Fusion Network for Multimodal Emotion Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3771--3782", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3316458", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3316458", abstract = "As deep learning technology research continues to progress, artificial intelligence technology is gradually empowering various fields. To achieve a more natural human-computer interaction experience, how to accurately recognize emotional state of speech \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Arend:2023:MCT, author = "Johannes M. 
Arend and Christoph P{\"o}rschmann and Stefan Weinzierl and Fabian Brinkmann", title = "Magnitude-Corrected and Time-Aligned Interpolation of Head-Related Transfer Functions", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3783--3799", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313908", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313908", abstract = "Head-related transfer functions (HRTFs) are essential for virtual acoustic realities because they contain all cues for localizing sound sources in three-dimensional space. Acoustic measurements are one way to obtain high-quality HRTFs. To reduce \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Raj:2023:SAT, author = "Desh Raj and Daniel Povey and Sanjeev Khudanpur", title = "{SURT} 2.0: Advances in Transducer-Based Multi-Talker Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3800--3813", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3318398", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3318398", abstract = "The Streaming Unmixing and Recognition Transducer (SURT) model was proposed recently as an end-to-end approach for continuous, streaming, multi-talker speech recognition (ASR).
Despite impressive results on multi-turn meetings, SURT has notable \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{An:2023:GVS, author = "Jiaming An and Zixiang Ding and Ke Li and Rui Xia", title = "Global-View and Speaker-Aware Emotion Cause Extraction in Conversations", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3814--3823", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3319990", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3319990", abstract = "Emotion cause extraction in conversations, the task of recognizing and extracting the causes behind the emotions in a conversation, is a new and under-explored task. It was previously treated as an utterance-level task, that can only extract cause of one \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2023:CCI, author = "Yuqin Lin and Longbiao Wang and Yanbing Yang and Jianwu Dang", title = "{CFDRN}: a Cognition-Inspired Feature Decomposition and Recombination Network for Dysarthric Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3824--3836", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3319276", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3319276", abstract = "As an essential technology in human-computer interactions, automatic speech recognition (ASR) ensures a convenient 
life for healthy people; however, people with speech disorders, who truly need support from such a technology, have experienced \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Blandin:2023:CSA, author = "R{\'e}mi Blandin and Simon Stone and Ang{\'e}lique Remacle and Vincent Didone and Peter Birkholz", title = "A Comparative Study of {$3$D} and {$1$D} Acoustic Simulations of the Higher Frequencies of Speech", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3837--3847", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313423", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313423", abstract = "Articulatory synthesis generates speech sounds by simulating the physical phenomena involved in speech production. 
The accuracy of the physical modelling is expected to affect the naturalness of the synthesis: the more realistic the description is, the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2023:TRA, author = "Qing Wang and Jixun Yao and Li Zhang and Pengcheng Guo and Lei Xie", title = "Timbre-Reserved Adversarial Attack in Speaker Identification", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3848--3858", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3306714", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3306714", abstract = "As a type of biometric identification, speaker identification (SID) systems face various attacks. Spoofing attacks imitate target speakers' timbre, while adversarial attacks confuse SID systems with well-designed perturbations. 
Spoofing mimics \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:PTT, author = "Yachao Li and Junhui Li and Jing Jiang and Shimin Tao and Hao Yang and Min Zhang", title = "P-Transformer: Towards Better Document-to-Document Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3859--3870", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313445", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313445", abstract = "Directly training a document-to-document (Doc2Doc) neural machine translation (NMT) via Transformer from scratch, especially on small datasets, usually fails to converge. Our dedicated probing tasks show that (1) both the absolute position and relative \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xie:2023:NNV, author = "Chao Xie and Tomoki Toda", title = "Noisy-to-Noisy Voice Conversion Under Variations of Noisy Condition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3871--3882", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313426", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313426", abstract = "Voice conversion (VC) refers to the transformation of the speaker identity of a speech to the target one without altering the linguistic content.
As recent VC techniques have made significant progress, implementing them in real-world scenarios is also \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2023:MVH, author = "Zhichao Wang and Xinsheng Wang and Qicong Xie and Tao Li and Lei Xie and Qiao Tian and Yuping Wang", title = "{MSM-VC}: High-Fidelity Source Style Transfer for Non-Parallel Voice Conversion by Multi-Scale Style Modeling", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3883--3895", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313414", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313414", abstract = "In addition to conveying the linguistic content from source speech to converted speech, maintaining the speaking style of source speech also plays an important role in the voice conversion (VC) task, which is essential in many scenarios with highly \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2023:MGE, author = "Yilin Zhao and Hai Zhao and Sufeng Duan", title = "Multi-Grained Evidence Inference for Multi-Choice Reading Comprehension", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3896--3907", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313885", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313885", abstract = "Multi-choice Machine Reading Comprehension (MRC) is a
major and challenging task for machines to answer questions according to provided options. Answers in multi-choice MRC cannot be directly extracted in the given passages, and essentially require \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Du:2023:SSC, author = "Ye-Qian Du and Jie Zhang and Xin Fang and Ming-Hui Wu and Zhou-Wang Yang", title = "A Semi-Supervised Complementary Joint Training Approach for Low-Resource Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3908--3921", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313434", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313434", abstract = "Both unpaired speech and text have shown to be beneficial for low-resource automatic speech recognition (ASR), which, however were either separately used for pre-training, self-training and language model (LM) training, or jointly used for designing \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2023:ALS, author = "Changheng Li and Richard C. 
Hendriks", title = "Alternating Least-Squares-Based Microphone Array Parameter Estimation for a Single-Source Reverberant and Noisy Acoustic Scenario", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3922--3934", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3306713", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3306713", abstract = "Acoustic-scene-related parameters such as relative transfer functions (RTFs) and power spectral densities (PSDs) of the target source, late reverberation and ambient noise are essential for microphone array signal processing and are challenging to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2023:LPC, author = "Kun Zhou and Yuanhang Zhou and Wayne Xin Zhao and Ji-Rong Wen", title = "Learning to Perturb for Contrastive Learning of Unsupervised Sentence Representations", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3935--3944", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3304485", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3304485", abstract = "Recently, contrastive learning has been shown effective in fine-tuning pre-trained language models (PLM) to learn sentence representations, which incorporates perturbations into unlabeled sentences to augment semantically related positive examples for \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp;
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gotz:2023:CSM, author = "Georg G{\"o}tz and Sebastian J. Schlecht and Ville Pulkki", title = "Common-Slope Modeling of Late Reverberation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3945--3957", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3317572", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3317572", abstract = "The decaying sound field in rooms is typically described by energy decay functions (EDFs). Late reverberation can deviate considerably from the ideal diffuse field, for example, in multiple connected rooms or non-uniform absorption material distributions. \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2023:MLC, author = "Guanhua Chen and Runzhe Zhan and Derek F. Wong and Lidia S. Chao", title = "Multi-Level Curriculum Learning for Multi-Turn Dialogue Generation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3958--3967", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3322583", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3322583", abstract = "Since deep learning is the dominant paradigm in the multi-turn dialogue generation task, large-scale training data is the key factor affecting the model performance. 
To make full use of the training data, the existing work directly applied curriculum \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chuang:2023:MGM, author = "Yun-Yen Chuang and Hung-Min Hsu and Kevin Lin and Ray-I. Chang and Hung-Yi Lee", title = "{MetaEx-GAN}: Meta Exploration to Improve Natural Language Generation via Generative Adversarial Networks", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3968--3980", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3317571", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3317571", abstract = "Generative Adversarial Networks (GANs) have been popularly researched in natural language generation, so-called Language GANs. Existing works adopt reinforcement learning (RL) based methods such as policy gradients for training Language GANs. 
The previous \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tong:2023:QEB, author = "Chuxuan Tong and Xi Zheng and Jianhua Li and Xingjun Ma and Longxiang Gao and Yong Xiang", title = "Query-Efficient Black-Box Adversarial Attacks on Automatic Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3981--3992", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3304476", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3304476", abstract = "The susceptibility of Deep Neural Networks (DNNs) to adversarial attacks has raised concerns regarding their practical applications in real-world scenarios. Although the vulnerability of DNNs to adversarial attacks has been extensively studied in the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2023:HSM, author = "Xixin Wu and Hui Lu and Kun Li and Zhiyong Wu and Xunying Liu and Helen Meng", title = "Hiformer: Sequence Modeling Networks With Hierarchical Attention Mechanisms", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "3993--4003", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313428", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313428", abstract = "The attention-based encoder-decoder structure, such as the Transformer, has achieved state-of-the-art performance on various sequence modeling tasks,
e.g., machine translation (MT) and automatic speech recognition (ASR), benefited from the superior \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2023:DMP, author = "Ante Wang and Linfeng Song and Lifeng Jin and Junfeng Yao and Haitao Mi and Chen Lin and Jinsong Su and Dong Yu", title = "{D$^2$PSG}: Multi-Party Dialogue Discourse Parsing as Sequence Generation", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "4004--4013", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3313415", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313415", abstract = "Conversational discourse analysis aims to extract the interactions between dialogue turns, which is crucial for modeling complex multi-party dialogues. 
As the benchmarks are still limited in size and human annotations are costly, the current standard \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gao:2023:BST, author = "Nan Gao and Yongjian Wang and Peng Chen and Jijun Tang", title = "Boosting Short Text Classification by Solving the {OOV} Problem", journal = j-IEEE-ACM-TASLP, volume = "31", number = "??", pages = "4014--4024", year = "2023", DOI = "https://doi.org/10.1109/TASLP.2023.3316422", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:06:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3316422", abstract = "In the field of natural language processing, text classification has received a lot of attention. Compared with long texts, short texts have fewer words and lack contextual semantic information. Existing approaches enrich short text information by linking \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2024:SAS, author = "Jin Chu Wu and Raghu N. 
Kacker", title = "Statistical Analysis for Speaker Recognition Evaluation With Data Dependence and Three Score Distributions", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1--14", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3313447", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3313447", abstract = "The speaker recognition evaluation is conducted in a framework in which three score distributions and two decision thresholds are employed, and the statistic of interest is an average of the two weighted sums \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2024:OAN, author = "Yongwei Zhou and Junwei Bao and Youzheng Wu and Xiaodong He and Tiejun Zhao", title = "Operation-Augmented Numerical Reasoning for Question Answering", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "15--28", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3316448", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3316448", abstract = "Question answering requiring numerical reasoning, which generally involves symbolic operations such as sorting, counting, and addition, is a challenging task.
To address such a problem, existing mixture-of-experts \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Purushothaman:2024:SDF, author = "Anurenjan Purushothaman and Debottam Dutta and Rohit Kumar and Sriram Ganapathy", title = "Speech Dereverberation With Frequency Domain Autoregressive Modeling", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "29--38", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3317570", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3317570", abstract = "Speech applications in far-field real world settings often deal with signals that are corrupted by reverberation. The task of dereverberation constitutes an important step to improve the audible quality and to reduce the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Qu:2024:DPR, author = "Leyuan Qu and Taihao Li and Cornelius Weber and Theresa Pekarek-Rosin and Fuji Ren and Stefan Wermter", title = "Disentangling Prosody Representations With Unsupervised Speech Reconstruction", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "39--54", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3320864", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3320864", abstract = "Human speech can be characterized by different components, including semantic content, speaker identity and prosodic
information. Significant progress has been made in disentangling representations for \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pedersen:2024:DDN, author = "Mathias Bach Pedersen and S{\o}ren Holdt Jensen and Zheng-Hua Tan and Jesper Jensen", title = "Data-Driven Non-Intrusive Speech Intelligibility Prediction Using Speech Presence Probability", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "55--67", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3321964", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3321964", abstract = "Time consuming Speech Intelligibility (SI) listening tests with human subjects can be replaced by algorithmic SI predictors. In recent years, data-driven SI predictors have been showing promising results.
A major limiting \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hou:2024:CSE, author = "Yuanbo Hou and Bo Kang and Andrew Mitchell and Wenwu Wang and Jian Kang and Dick Botteldooren", title = "Cooperative Scene-Event Modelling for Acoustic Scene Classification", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "68--82", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3323135", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3323135", abstract = "Acoustic scene classification (ASC) can be helpful for creating context awareness for intelligent robots. Humans naturally use the relations between acoustic scenes (AS) and audio events (AE) to understand and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jiang:2024:ESD, author = "Xiaotong Jiang and Peiwen You and Chen Chen and Zhongqing Wang and Guodong Zhou", title = "Exploring Scope Detection for Aspect-Based Sentiment Analysis", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "83--94", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3323136", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3323136", abstract = "Aspect-based sentiment analysis (ABSA) aims to extract the aspect terms from review text, and to predict the polarity towards the aspect term.
Although neural models have achieved competitive results, there are still \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2024:BSQ, author = "Xuenan Xu and Zeyu Xie and Mengyue Wu and Kai Yu", title = "Beyond the Status Quo: a Contemporary Survey of Advances and Challenges in Audio Captioning", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "95--112", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3321968", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3321968", abstract = "Automated audio captioning (AAC), a task that mimics human perception as well as innovatively links audio processing and natural language processing, has overseen much progress over the last few years.
AAC \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Miotello:2024:DPB, author = "Federico Miotello and Mirco Pezzoli and Luca Comanducci and Fabio Antonacci and Augusto Sarti", title = "Deep Prior-Based Audio Inpainting Using Multi-Resolution Harmonic Convolutional Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "113--123", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3324556", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3324556", abstract = "In this manuscript, we propose a novel method to perform audio inpainting, i.e., the restoration of audio signals presenting multiple missing parts. Audio inpainting can be interpreted in the context of inverse problems as \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Stanciu:2024:DBW, author = "Cristian-Lucian Stanciu and Jacob Benesty and Constantin Paleologu and Ruxandra-Liana Costea and Laura-Maria Dogariu and Silviu Ciochin{\u{a}}", title = "Decomposition-Based {Wiener} Filter Using the {Kronecker} Product and Conjugate Gradient Method", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "124--138", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3325136", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3325136", abstract = "The identification of long-length impulse responses represents a 
challenge in the context of many applications, like echo cancellation. Recently, the problem has been addressed in the framework of low-rank systems, \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2024:ANG, author = "Huiyao Chen and Yueheng Sun and Meishan Zhang and Min Zhang", title = "Automatic Noise Generation and Reduction for Text Classification", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "139--150", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3325135", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3325135", abstract = "Label noise is an important issue in machine learning, which might lead to negative influences on various tasks. 
Given that real benchmarks for evaluation of noise reduction methods are limited, plenty of studies construct \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xu:2024:MCG, author = "Jiaming Xu and Jian Cui and Yunzhe Hao and Bo Xu", title = "Multi-Cue Guided Semi-Supervised Learning Toward Target Speaker Separation in Real Environments", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "151--163", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3323856", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3323856", abstract = "To solve the cocktail party problem in real multi-talker environments, this article proposed a multi-cue guided semi-supervised target speaker separation method (MuSS). 
Our MuSS integrates three target speaker-related \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xiang:2024:TSD, author = "Yang Xiang and Jesper Lisby H{\o}jvang and Morten H{\o}jfeldt Rasmussen and Mads Gr{\ae}sb{\o}ll Christensen", title = "A Two-Stage Deep Representation Learning-Based Speech Enhancement Method Using Variational Autoencoder and Adversarial Training", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "164--177", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3321975", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3321975", abstract = "This article focuses on leveraging deep representation learning (DRL) for speech enhancement (SE). In general, the performance of the deep neural network (DNN) is heavily dependent on the learning of data representation. 
\ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2024:CLT, author = "Xiao Li and Ruirui Liu and Huichou Huang and Qingyao Wu", title = "Contrastive Learning for Target Speaker Extraction With Attention-Based Fusion", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "178--188", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3324550", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3324550", abstract = "Given a reference speech clip from the target speaker, Target Speaker Extraction (TSE) is a challenging task that involves extracting the signal of the target speaker from a multi-speaker environment. TSE networks \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liang:2024:ELR, author = "Xiaobo Liang and Runze Mao and Lijun Wu and Juntao Li and Min Zhang and Qing Li", title = "Enhancing Low-Resource {NLP} by Consistency Training With Data and Model Perturbations", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "189--199", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3325970", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3325970", abstract = "Natural language processing (NLP) has recently shown significant progress in rich-resource scenarios. 
However, it is much less effective for low-resource scenarios due to the model easily overfitting to limited training data \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lu:2024:CXP, author = "Haisheng Lu and Jiangnan Liang and Chuang Shi", title = "Comments on ``{Primary}-Ambient Extraction Using Ambient Spectrum Estimation for Immersive Spatial Audio Reproduction''", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "200--202", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3328286", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", note = "See \cite{He:2015:PAE}.", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3328286", abstract = "In the above paper, He et al. propose a primary-ambient extraction method using ambient phase estimation with a sparsity constraint (APES). 
The primary-ambient extraction problem is formulated as a \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Drgas:2024:DPN, author = "Szymon Drgas and Lars Bramsl{\o}w and Archontis Politis and Gaurav Naithani and Tuomas Virtanen", title = "Dynamic Processing Neural Network Architecture for Hearing Loss Compensation", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "203--214", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3328285", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3328285", abstract = "This paper proposes neural networks for compensating sensorineural hearing loss. The aim of the hearing loss compensation task is to transform a speech signal to increase speech intelligibility after further \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gelderblom:2024:PPO, author = "Femke B. 
Gelderblom and Tron Vedul Tronstad and Torbj{\o}rn Svendsen and Tor Andre Myrvoll", title = "On the Predictive Power of Objective Intelligibility Metrics for the Subjective Performance of Deep Complex Convolutional Recurrent Speech Enhancement Networks", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "215--226", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3329378", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3329378", abstract = "Speech enhancement (SE) systems aim to improve the quality and intelligibility of degraded speech signals obtained from far-field microphones. Subjective evaluation of the intelligibility performance of these SE \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Haubner:2024:EED, author = "Thomas Haubner and Andreas Brendel and Walter Kellermann", title = "End-to-End Deep Learning-Based Adaptation Control for Linear Acoustic Echo Cancellation", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "227--238", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3325923", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3325923", abstract = "The attenuation of acoustic loudspeaker echoes remains to be one of the open challenges to achieve pleasant full-duplex hands free speech communication. 
In many modern signal enhancement interfaces, this problem is \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jiang:2024:OGT, author = "Congcong Jiang and Tieyun Qian and Bing Liu", title = "One General Teacher for Multi-Data Multi-Task: a New Knowledge Distillation Framework for Discourse Relation Analysis", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "239--249", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3328289", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3328289", abstract = "Automatically identifying the discourse relations can help many downstream NLP tasks such as reading comprehension and machine translation. It can be categorized into explicit and implicit discourse \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Nayem:2024:ABS, author = "Khandokar Md. Nayem and Donald S. 
Williamson", title = "Attention-Based Speech Enhancement Using Human Quality Perception Modeling", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "250--260", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3328282", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3328282", abstract = "Perceptually-inspired objective functions such as the perceptual evaluation of speech quality (PESQ), signal-to-distortion ratio (SDR), and short-time objective intelligibility (STOI), have recently been used to \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2024:CQE, author = "Ying Zhang and Fandong Meng and Yufeng Chen and Jinan Xu and Jie Zhou", title = "Complex Question Enhanced Transfer Learning for Zero-Shot Joint Information Extraction", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "261--275", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3304481", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3304481", abstract = "Zero-shot information extraction (IE) tasks have attracted great attention recently. However, how to jointly model multiple IE tasks in the zero-shot scenario is still an open question.
In this article, we focus on zero-shot \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yan:2024:DOM, author = "Jingsong Yan and Piji Li and Haibin Chen and Junhao Zheng and Qianli Ma", title = "Does the Order Matter? {A} Random Generative Way to Learn Label Hierarchy for Hierarchical Text Classification", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "276--285", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3329374", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3329374", abstract = "Hierarchical Text Classification (HTC) is an essential and challenging task due to the difficulty of modeling label hierarchy. Recent generative methods have achieved state-of-the-art performance by flattening the \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Paraskevopoulos:2024:SEU, author = "Georgios Paraskevopoulos and Theodoros Kouzelis and Georgios Rouvalis and Athanasios Katsamanis and Vassilis Katsouros and Alexandros Potamianos", title = "Sample-Efficient Unsupervised Domain Adaptation of Speech Recognition Systems: a Case Study for Modern {Greek}", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "286--299", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3328280", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3328280", abstract = "Modern speech recognition 
systems exhibit rapid performance degradation under domain shift. This issue is especially prevalent in data-scarce settings, such as low-resource languages, where the diversity of \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Accolti:2024:URA, author = "Ernesto Accolti and Javier Gimenez and Michael Vorl{\"a}nder", title = "Uncertainties of Room Acoustics Simulation Due to Directivity Data of Musical Instruments", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "300--309", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3330117", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3330117", abstract = "Simulations and auralization methods in the field of room acoustics require the directivity of sound sources in third-octave frequency bands, which simplifies the calculation algorithms but introduces uncertainty.
However, \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Masuyama:2024:CRD, author = "Yoshiki Masuyama and Kouei Yamaoka and Yuma Kinoshita and Taishi Nakashima and Nobutaka Ono", title = "Causal and Relaxed-Distortionless Response Beamforming for Online Target Source Extraction", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "310--324", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3329377", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3329377", abstract = "In this paper, we propose a low-latency beamforming method for target source extraction. Beamforming has been performed in the time-frequency domain and achieved promising results in offline applications. \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Prabhavalkar:2024:EES, author = "Rohit Prabhavalkar and Takaaki Hori and Tara N. 
Sainath and Ralf Schl{\"u}ter and Shinji Watanabe", title = "End-to-End Speech Recognition: a Survey", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "325--351", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3328283", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3328283", abstract = "In the last decade of automatic speech recognition (ASR) research, the introduction of deep learning has brought considerable reductions in word error rate of more than 50\% relative, compared to modeling \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2024:JQJ, author = "Yun Zhao and Dexi Liu and Changxuan Wan and Xiping Liu and Jian-yun Nie and Jiaming Liu", title = "{JMS-QA}: a Joint Hierarchical Architecture for Mental Health Question Answering", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "352--363", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3329295", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3329295", abstract = "With the increasing scale of mental health problems in modern society, the scarcity of professional assistance is alarming, especially in developing countries. 
To address this, some online forums have emerged to \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ni:2024:DRD, author = "Shiwen Ni and Jiawen Li and Min Yang and Hung-Yu Kao", title = "{DropAttack}: a Random Dropped Weight Attack Adversarial Training for Natural Language Understanding", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "364--373", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3330613", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3330613", abstract = "Adversarial training has been proven to be a powerful regularization technique to improve language models. In this work, we propose a novel random \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhu:2024:BCI, author = "Tiantian Zhu and Yang Qin and Ming Feng and Qingcai Chen and Baotian Hu and Yang Xiang", title = "{BioPRO}: Context-Infused Prompt Learning for Biomedical Entity Linking", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "374--385", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3331149", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3331149", abstract = "Recent research tends to address the biomedical entity linking problem in a unified framework solely based on surface form matching between mentions and entities. 
Specifically, these methods focus on addressing \ldots (More)", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2024:MLI, author = "Jiapu Wang and Boyue Wang and Junbin Gao and Simin Hu and Yongli Hu and Baocai Yin", title = "Multi-Level Interaction Based Knowledge Graph Completion", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "386--396", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3331121", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3331121", abstract = "With the continuous emergence of new knowledge, Knowledge Graph (KG) typically suffers from the incompleteness problem, hindering the performance of downstream applications. Thus, Knowledge Graph Completion (KGC) has attracted considerable attention. \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2024:ERF, author = "Qiangqiang Zhang and Dongyuan Lin and Yingying Xiao and Yunfei Zheng and Shiyuan Wang", title = "Error Reused Filtered-{$X$} Least Mean Square Algorithm for Active Noise Control", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "397--412", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3330077", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3330077", abstract = "The conventional active noise control (ANC) system relies on the error-correction learning to design the adaptive controller. 
However, as the residual noise, the correction error is discarded after each iteration and is still not a perfect input to the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jin:2024:PAD, author = "Zengrui Jin and Mengzhe Geng and Jiajun Deng and Tianzi Wang and Shujie Hu and Guinan Li and Xunying Liu", title = "Personalized Adversarial Data Augmentation for Dysarthric and Elderly Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "413--429", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3323888", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3323888", abstract = "Despite the rapid progress of automatic speech recognition (ASR) technologies targeting normal speech, accurate recognition of dysarthric and elderly speech remains a highly challenging task to date. 
It is difficult to collect large quantities of such \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kong:2024:AES, author = "Jun Kong and Jin Wang and Xuejie Zhang", title = "Adaptive Ensemble Self-Distillation With Consistent Gradients for Fast Inference of Pretrained Language Models", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "430--442", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3331080", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3331080", abstract = "Conditional computation algorithms, e.g., the early exiting (EE) strategy, can accelerate the inference of pretrained language models (PLMs) by exiting shallow layers without calculating the entire model. 
In addition to the adaptive inference of EE \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kitic:2024:BIA, author = "Sr{\dbar}an Kiti{\'c} and J{\'e}r{\^o}me Daniel", title = "Blind Identification of Ambisonic Reduced Room Impulse Response", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "443--458", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3332546", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3332546", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Shao:2024:DIM, author = "Qijie Shao and Pengcheng Guo and Jinghao Yan and Pengfei Hu and Lei Xie", title = "Decoupling and Interacting Multi-Task Learning Network for Joint Speech and Accent Recognition", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "459--470", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3332542", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3332542", abstract = "Accents pose significant challenges for speech recognition systems. 
Although joint automatic speech recognition (ASR) and accent recognition (AR) training has been proven effective in handling multi-accent scenarios, current multi-task ASR-AR approaches \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhu:2024:BCD, author = "Han Zhu and Gaofeng Cheng and Jindong Wang and Wenxin Hou and Pengyuan Zhang and Yonghong Yan", title = "Boosting Cross-Domain Speech Recognition With Self-Supervision", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "471--485", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3301230", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3301230", abstract = "The cross-domain performance of automatic speech recognition (ASR) could be severely hampered due to the mismatch between training and testing distributions. 
Since the target domain usually lacks labeled data, and domain shifts exist at acoustic and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2024:GSL, author = "Yile Wang and Yue Zhang and Peng Li and Yang Liu", title = "Gradual Syntactic Label Replacement for Language Model Pre-Training", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "486--496", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3331096", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3331096", abstract = "Pre-training serves as a foundation of recent NLP models, where language modeling tasks are performed over large texts. Typical models like BERT and GPT take the corpus as a whole and treat each word equally for language modeling.
However, recent works \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ma:2024:CSD, author = "Penghui Ma and Jianfeng Li and Jingjing Pan and Xiaofei Zhang and Roberto Gil-Pita", title = "Coherent Signal {DOA} Estimation With Coprime Array: Exploiting Signal Subspace Reconstructing Strategy", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "497--508", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3334482", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3334482", abstract = "Coprime array possesses a larger array aperture and element spacing compared with the conventional uniform linear array (ULA) for the equivalent number of sensors, attracting considerable scholarly attention. However, the direction of arrival (DOA) \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hamel:2024:FIA, author = "Emma Hamel and Nickvash Kani", title = "Factors That Influence Automatic Recognition of {African-American} Vernacular {English} in Machine-Learning Models", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "509--516", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3331139", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3331139", abstract = "Racial bias is a well-documented problem in natural language processing (NLP). 
The dialectal language used by marginalized groups is often misclassified or mischaracterized by language models, which in turn can further disenfranchise these populations. \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2024:JMC, author = "Jingbei Li and Sipan Li and Ping Chen and Luwen Zhang and Yi Meng and Zhiyong Wu and Helen Meng and Qiao Tian and Yuping Wang and Yuxuan Wang", title = "Joint Multiscale Cross-Lingual Speaking Style Transfer With Bidirectional Attention Mechanism for Automatic Dubbing", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "517--528", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3331813", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3331813", abstract = "Automatic dubbing, which generates a corresponding version of the input speech in another language, can be widely utilized in many real-world scenarios, such as video and game localization. 
In addition to synthesizing the translated scripts, automatic \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Han:2024:SSL, author = "Bing Han and Zhengyang Chen and Yanmin Qian", title = "Self-Supervised Learning With Cluster-Aware-{DINO} for High-Performance Robust Speaker Verification", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "529--541", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3331949", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3331949", abstract = "The automatic speaker verification task has achieved great success using deep learning approaches with a large-scale, manually annotated dataset. However, collecting a significant amount of well-labeled data for system building is very difficult and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tesch:2024:MCS, author = "Kristina Tesch and Timo Gerkmann", title = "Multi-Channel Speech Separation Using Spatially Selective Deep Non-Linear Filters", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "542--553", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3334101", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3334101", abstract = "In a multi-channel separation task with multiple speakers, we aim to recover all individual speech signals from the mixture. 
In contrast to single-channel approaches, which rely on the different spectro-temporal characteristics of the speech signals, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Pei:2024:GFM, author = "Hao-Chen Pei and Hao Fang and Xin Luo and Xin-Shun Xu", title = "{Gradformer}: a Framework for Multi-Aspect Multi-Granularity Pronunciation Assessment", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "554--563", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3335807", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3335807", abstract = "Automatic pronunciation assessment is an indispensable technology in computer-assisted pronunciation training systems. 
To further evaluate the quality of pronunciation, multi-task learning with simultaneous output of multi-granularity and multi-aspect has \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sharma:2024:TFS, author = "Garima Sharma and Karthikeyan Umapathy and Sridhar Krishnan", title = "Time-Frequency Scattergrams for Biomedical Audio Signal Representation and Classification", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "564--576", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3332544", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3332544", abstract = "Speech, music, and environmental sounds are the main forms of audio signals that are widely studied. 
There is a certain amount of texture present in every sound, and our human auditory system is not efficient in recognizing and classifying these audio \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Man:2024:WMD, author = "Zhibo Man and Zengcheng Huang and Yujie Zhang and Yu Li and Yuanmeng Chen and Yufeng Chen and Jinan Xu", title = "{WDSRL}: Multi-Domain Neural Machine Translation With Word-Level Domain-Sensitive Representation Learning", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "577--590", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3336515", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3336515", abstract = "Due to the strong reliance on domain-specific knowledge, the joint learning manner of domain discrimination and translation has been widely considered in the Multi-Domain Neural Machine Translation (MDNMT) task. 
However, the word ambiguity problem still \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2024:UMV, author = "Chin-Po Chen and Ho-Hsien Pan and Susan Shur-Fen Gau and Chi-Chun Lee", title = "Using Measures of Vowel Space for Autistic Traits Characterization", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "591--607", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3330605", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3330605", abstract = "Autism Spectrum Disorder (ASD) is a neurodevelopmental disorder that is prevalent and heterogeneous. Autistic traits describe a wide heterogeneity of behavior symptoms of ASD, and these traits are reflections of core neurodevelopment function deficits. 
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wilkinghoff:2024:WDA, author = "Kevin Wilkinghoff and Frank Kurth", title = "Why Do Angular Margin Losses Work Well for Semi-Supervised Anomalous Sound Detection?", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "608--622", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3337153", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3337153", abstract = "State-of-the-art anomalous sound detection systems often utilize angular margin losses to learn suitable representations of acoustic data using an auxiliary task, which usually is a supervised or self-supervised classification task. The underlying idea is \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Rouhe:2024:PCE, author = "Aku Rouhe and Tam{\'a}s Gr{\'o}sz and Mikko Kurimo", title = "Principled Comparisons for End-to-End Speech Recognition: Attention vs Hybrid at the $ 1000$-Hour Scale", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "623--638", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3336517", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3336517", abstract = "End-to-End speech recognition has become the center of attention for speech recognition research, but Hybrid Hidden Markov Model Deep Neural Network (HMM/DNN) -systems remain a competitive 
approach in terms of performance. End-to-End models may be better \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2024:LCS, author = "Yile Wang and Yue Zhang", title = "Lost in Context? {On} the Sense-Wise Variance of Contextualized Word Embeddings", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "639--650", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3337643", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3337643", abstract = "Contextualized word embeddings in language models have given much advance to NLP. Intuitively, sentential information is integrated into the representation of words, which can help model polysemy. However, context sensitivity also leads to the variance of \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hold:2024:CHO, author = "Christoph Hold and Ville Pulkki and Archontis Politis and Leo McCormack", title = "Compression of Higher-Order Ambisonic Signals Using Directional Audio Coding", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "651--665", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3328284", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3328284", abstract = "Delivering high-quality spatial audio in the Ambisonics format requires extensive data bandwidth, which may render it inaccessible for many low-bandwidth 
applications. Existing widely-available multi-channel audio compression codecs are not designed to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2024:NJT, author = "Shouhui Wang and Biao Qin", title = "A Novel Joint Training Model for Knowledge Base Question Answering", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "666--679", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3336526", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3336526", abstract = "In knowledge base question answering (KBQA) systems, relation detection and entity recognition are two core components. However, since the relation detection in KBQA contains thousands of relations and this task always becomes a zero-shot learning task \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2024:SCS, author = "Songbin Li and Jingang Wang and Peng Liu and Ke Shi", title = "{SANet}: a Compressed Speech Encoder and Steganography Algorithm Independent Steganalysis Deep Neural Network", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "680--690", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3337667", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3337667", abstract = "Most of the existing steganalysis methods for low-bit-rate compressed speech are specifically designed for a particular speech 
encoder or category of steganography methods, limiting their generalization capability. These methods require pre-selection of \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kanan:2024:IHC, author = "Tarek Kanan and Amani AbedAlghafer and Shadi AlZu'bi and Bilal Hawashin and Ala Mughaid and Ghassan Kanaan and M. M. Kamruzzaman", title = "An Intelligent Health Care System for Detecting Drug Abuse in Social Media Platforms Based on Low Resource Language", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "691--703", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3294699", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3294699", abstract = "Lately, the use of the Internet has led to an increase in social networking sites. 
The world has become an open environment, and social networking sites have been increasingly used to exchange medical experiences, and they have been adopted in many cases \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Varela:2024:ERS, author = "Alejandro Santorum Varela and Svetlana Stoyanchev and Simon Keizer and Rama Doddipatla and Kate Knill", title = "Entity Resolution in Situated Dialog With Unimodal and Multimodal Transformers", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "704--713", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3304468", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3304468", abstract = "In this work we address the entity resolution task for situated multimodal dialog investigating how a unimodal approach, which uses only textual information as input (representing visual attributes as text), compares to a multimodal system, which \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{He:2024:LSE, author = "Huang He and Hua Lu and Siqi Bao and Fan Wang and Hua Wu and Zheng-Yu Niu and Haifeng Wang", title = "Learning to Select External Knowledge With Multi-Scale Negative Sampling", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "714--720", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3301222", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = 
"https://dl.acm.org/doi/10.1109/TASLP.2023.3301222", abstract = "The Track-1 of DSTC9 aims to effectively answer user requests or questions during task-oriented dialogues, which are out of the scope of APIs/DB. By leveraging external knowledge resources, relevant information can be retrieved and encoded into the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lu:2024:TBO, author = "Hua Lu and Zhen Guo and Chanjuan Li and Yunyi Yang and Huang He and Siqi Bao", title = "Towards Building an Open-Domain Dialogue System Incorporated With {Internet} Memes", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "721--726", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3288413", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3288413", abstract = "In recent years, Internet memes have been widely used in online chatting. Compared with text-based communication, conversations become more expressive and attractive when Internet memes are incorporated. 
This article presents our solutions for the Meme \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lim:2024:AMD, author = "Jungwoo Lim and Taesun Whang and Dongyub Lee and Heuiseok Lim", title = "Adaptive Multi-Domain Dialogue State Tracking on Spoken Conversations", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "727--732", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3302232", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3302232", abstract = "The main objective of the task-oriented dialogue system is to identify the intent and needs of human dialogue. Many existing studies are conducted under the setting of written dialogue, but there always exists a difficulty in coping with real-world spoken \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Thulke:2024:TOD, author = "David Thulke and Nico Daheim and Christian Dugast and Hermann Ney", title = "Task-Oriented Document-Grounded Dialog Systems by {HLTPR@RWTH} for {DSTC9} and {DSTC10}", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "733--741", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3267832", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3267832", abstract = "This paper summarizes our contributions to the document-grounded dialog tasks at the 9th and 10th Dialog System Technology Challenges (DSTC9 and 
DSTC10). In both iterations the task consists of three subtasks: first detect whether the current turn is \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wu:2024:SAD, author = "Han Wu and Kun Xu and Linqi Song", title = "Structure-Aware Dialogue Modeling Methods for Conversational Semantic Role Labeling", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "742--752", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3331576", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3331576", abstract = "Conversational semantic role labeling (CSRL) is believed to be a crucial step toward dialogue understanding. By incorporating the CSRL information into the conversational models, previous work (Xu et al., 2021) has confirmed the usefulness of CSRL to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2024:DMC, author = "Zhe Chen and Hongcheng Liu and Yu Wang", title = "{DialogMCF}: Multimodal Context Flow for Audio Visual Scene-Aware Dialog", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "753--764", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3284511", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3284511", abstract = "In recent years, Audio Visual Scene-Aware Dialog (AVSD) has been an active research task in the multimodal dialogue community and has also been a core 
part of the Dialog System Technology Challenge (DSTC). This task is an extension of conventional visual \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yoshino:2024:OTD, author = "Koichiro Yoshino and Yun-Nung Chen and Paul Crook and Satwik Kottur and Jinchao Li and Behnam Hedayatnia and Seungwhan Moon and Zhengcong Fei and Zekang Li and Jinchao Zhang and Yang Feng and Jie Zhou and Seokhwan Kim and Yang Liu and Di Jin and Alexandros Papangelis and Karthik Gopalakrishnan and Dilek Hakkani-Tur and Babak Damavandi and Alborz Geramifard and Chiori Hori and Ankit Shah and Chen Zhang and Haizhou Li and Jo{\~a}o Sedoc and Luis F. D'Haro and Rafael Banchs and Alexander Rudnicky", title = "Overview of the Tenth Dialog System Technology Challenge: {DSTC10}", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "765--778", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3293030", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3293030", abstract = "This article introduces the Tenth Dialog System Technology Challenge (DSTC-10). This edition of the DSTC focuses on applying end-to-end dialog technologies for five distinct tasks in dialog systems, namely 1. Incorporation of Meme images into open domain \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yadav:2024:JDB, author = "Shekhar Kumar Yadav and Nithin V. 
George", title = "Joint Dereverberation and Beamforming With Blind Estimation of the Shape Parameter of the Desired Source Prior", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "779--793", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3335000", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3335000", abstract = "Dereverberation and acoustic beamforming is used to capture the speech of a desired speaker in the presence of interfering speakers in a reverberant room using an array of microphones. Traditionally, to perform these two tasks, the desired speech is \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2024:LSV, author = "Yanxiong Li and Zhongjie Jiang and Qisheng Huang and Wenchang Cao and Jialong Li", title = "Lightweight Speaker Verification Using Transformation Module With Feature Partition and Fusion", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "794--806", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3338533", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3338533", abstract = "Although many efforts have been made on decreasing the model complexity for speaker verification, it is still challenging to deploy speaker verification systems with satisfactory result on low-resource terminals. 
We design a transformation module that \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Dai:2024:DDN, author = "Yuhan Dai and Zhirui Zhang and Yichao Du and Shengcai Liu and Lemao Liu and Tong Xu", title = "Datastore Distillation for Nearest Neighbor Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "807--817", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3337633", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3337633", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2024:TSA, author = "Changtao Li and Feiran Yang and Jun Yang", title = "A Two-Stage Approach to Quality Restoration of Bone-Conducted Speech", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "818--829", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3337988", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3337988", abstract = "Bone-conducted speech is not susceptible to background noise but suffers from poor speech quality and intelligibility due to the limited bandwidth. 
This paper proposes a two-stage approach to restore the quality of bone-conducted speech, namely, bandwidth \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2024:CCI, author = "Jie Zhou and Yuanbiao Lin and Qin Chen and Qi Zhang and Xuanjing Huang and Liang He", title = "{CausalABSC}: Causal Inference for Aspect Debiasing in Aspect-Based Sentiment Classification", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "830--840", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3340606", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3340606", abstract = "As the primary subtask of sentiment analysis, aspect-based sentiment classification (ABSC) aims to predict the sentiment polarity for a given aspect. 
While recent deep neural models for ABSC have shown good performance, their robustness is limited due to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lu:2024:HTA, author = "Ruiying Lu and Bo Chen and Dandan Guo and Dongsheng Wang and Mingyuan Zhou", title = "Hierarchical Topic-Aware Contextualized Transformers", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "841--852", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3339344", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3339344", abstract = "Training on disjoint fixed-length segments, Transformers convert static word embeddings into contextualized word representations. However, they often restrict the context of a token to the segment it resides in and hence neglect the contextual information \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2024:FFD, author = "Yaru Zhao and Bo Cheng and Yakun Huang and Zhiguo Wan", title = "{FluGCF}: a Fluent Dialogue Generation Model With Coherent Concept Entity Flow", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "853--867", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3340610", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3340610", abstract = "The integration of external knowledge graphs into dialogue systems effectively mitigates the generation of generic 
and uninteresting responses. This approach, particularly the explicit modeling of conversation flows from related concept entities, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ding:2024:CAL, author = "Changhao Ding and Zhangjie Fu and Zhongliang Yang and Qi Yu and Daqiu Li and Yongfeng Huang", title = "Context-Aware Linguistic Steganography Model Based on Neural Machine Translation", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "868--878", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3340601", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3340601", abstract = "Linguistic steganography based on text generation is a hot topic in the field of text information hiding. 
Previous studies have managed to improve the syntactic quality of steganography texts using natural language processing techniques based on deep \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Alhakeem:2024:DRL, author = "Zainab Alhakeem and Se-In Jang and Hong-Goo Kang", title = "Disentangled Representations in Local-Global Contexts for {Arabic} Dialect Identification", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "879--890", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3341006", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3341006", abstract = "In this article, we propose a locally and globally informed disentanglement network for Arabic dialect identification (ADI). 
Our proposed disentanglement network aims to detach all irrelevant information (e.g., speaker, gender and channel) from the source \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lee:2024:PAW, author = "Jae-Hong Lee and Joon-Hyuk Chang", title = "Partitioning Attention Weight: Mitigating Adverse Effect of Incorrect Pseudo-Labels for Self-Supervised {ASR}", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "891--905", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3343615", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3343615", abstract = "The performance of automatic speech recognition (ASR) models has been significantly improved owing to advances in deep learning and end-to-end approaches. However, these require a large amount of labeled data, which are expensive to obtain. Semi-
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Fukuda:2024:IST, author = "Ryo Fukuda and Katsuhito Sudoh and Satoshi Nakamura", title = "Improving Speech Translation Accuracy and Time Efficiency With Fine-Tuned wav2vec 2.0-Based Speech Segmentation", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "906--916", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3343614", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3343614", abstract = "Speech translation (ST) automatically converts utterances in a source language into text in another language. Splitting continuous speech into shorter segments, known as speech segmentation, plays an important role in ST. 
Recent segmentation methods \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Leem:2024:SAF, author = "Seong-Gyun Leem and Daniel Fulford and Jukka-Pekka Onnela and David Gard and Carlos Busso", title = "Selective Acoustic Feature Enhancement for Speech Emotion Recognition With Noisy Speech", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "917--929", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3340603", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3340603", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Bohlender:2024:SSS, author = "Alexander Bohlender and Ann Spriet and Wouter Tirry and Nilesh Madhu", title = "Spatially Selective Speaker Separation Using a {DNN} With a Location Dependent Feature Extraction", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "930--945", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3343605", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3343605", abstract = "Deep neural networks (DNNs) have proven themselves as an effective means to separate clean speech from noisy mixtures. 
When there are multiple concurrent talkers, however, unambiguously defining the target output is not trivial, especially if the mixture \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Karo:2024:CTD, author = "Matan Karo and Arie Yeredor and Itshak Lapidot", title = "Compact Time-Domain Representation for Logical Access Spoofed Audio", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "946--958", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3341000", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3341000", abstract = "Anti-spoofing is the task of speech authentication. That is, identifying genuine human speech compared to spoofed speech.
The main focus of this paper is to suggest new representations for genuine and spoofed speech, based on the probability mass function \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Berebi:2024:ADH, author = "Or Berebi and Zamir Ben-Hur and David Lou Alon and Boaz Rafaely", title = "Analysis and Design of Head-Tracked Compensation for Bilateral Ambisonics", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "959--972", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3345140", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3345140", abstract = "Virtual and augmented reality technologies demand high-quality spatial sound recording and playback through headphones. However, achieving high-quality binaural reproduction requires a complex recording system and a large number of microphones. 
To address \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2024:UCL, author = "Wei Wang and Yanmin Qian", title = "Universal Cross-Lingual Data Generation for Low Resource {ASR}", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "973--983", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3345150", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3345150", abstract = "Significant advances in end-to-end (E2E) automatic speech recognition (ASR) have primarily been concentrated on languages rich in annotated data. Nevertheless, a large proportion of languages worldwide, which are typically low-resource, continue to pose \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Berghi:2024:LVS, author = "Davide Berghi and Philip J. B. Jackson", title = "Leveraging Visual Supervision for Array-Based Active Speaker Detection and Localization", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "984--995", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3346643", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3346643", abstract = "Conventional audio-visual approaches for active speaker detection (ASD) typically rely on visually pre-extracted face tracks and the corresponding single-channel audio to find the speaker in a video. 
Therefore, they tend to fail every time the face of the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Krause:2024:BSS, author = "Daniel Aleksander Krause and Guillermo Garc{\'\i}a-Barrios and Archontis Politis and Annamaria Mesaros", title = "Binaural Sound Source Distance Estimation and Localization for a Moving Listener", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "996--1011", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3346297", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3346297", abstract = "In this paper, we investigate the tasks of binaural source distance estimation (SDE) and direction-of-arrival estimation (DOAE) using motion-based cues in a scenario with a walking listener. 
On top of performing both tasks as separate problems, we study \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kim:2024:ASR, author = "Seung-Bin Kim and Sang-Hoon Lee and Ha-Yeong Choi and Seong-Whan Lee", title = "Audio Super-Resolution With Robust Speech Representation Learning of Masked Autoencoder", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1012--1022", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3349053", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3349053", abstract = "This paper proposes Fre-Painter, a high-fidelity audio super-resolution system that utilizes robust speech representation learning with various masking strategies. Recently, masked autoencoders have been found to be beneficial in learning robust \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Battal:2024:ACS, author = "Omer Musa Battal and Aykut Ko{\c{c}}", title = "Automatic Construction of Sememe Knowledge Bases From Machine Readable Dictionaries", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1023--1035", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3347927", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3347927", abstract = "Sememes are the minimum semantic units of natural languages. Words annotated with sememes are organized into Sememe Knowledge Bases (SKBs). 
SKBs are successfully applied to various high-level language processing tasks as external knowledge bases. However, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Krishna:2024:RLH, author = "Varun Krishna and Tarun Sai and Sriram Ganapathy", title = "Representation Learning With Hidden Unit Clustering for Low Resource Speech Applications", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1036--1047", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3337670", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3337670", abstract = "In this paper, we describe an approach to self-supervised representation learning from raw audio using a hidden unit clustering (HUC) framework. 
The input to the model consists of audio samples that are windowed and processed with 1-D convolutional \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Luo:2024:DGF, author = "Zhengding Luo and Dongyuan Shi and Woon-Seng Gan and Qirui Huang", title = "Delayless Generative Fixed-Filter Active Noise Control Based on Deep Learning and {Bayesian} Filter", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1048--1060", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3337632", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3337632", abstract = "The selective fixed-filter active noise control (SFANC) method can select suitable pre-trained control filters to attenuate incoming noises. 
However, the limited number of pre-trained filters is insufficient to effectively control various forms of noise, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chi:2024:CPE, author = "Zewen Chi and Heyan Huang and Luyang Liu and Yu Bai and Xiaoyan Gao and Xian-Ling Mao", title = "Can Pretrained {English} Language Models Benefit Non-{English} {NLP} Systems in Low-Resource Scenarios?", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1061--1074", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3267618", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3267618", abstract = "Pretrained language models have achieved great success in a wide range of natural language processing (NLP) problems, because they learn language representations from large-scale text corpora and can adapt to downstream tasks by finetuning them on \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2024:TSL, author = "Rui Liu and Yifan Hu and Haolin Zuo and Zhaojie Luo and Longbiao Wang and Guanglai Gao", title = "Text-to-Speech for Low-Resource Agglutinative Language With Morphology-Aware Language Model Pre-Training", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1075--1087", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3348762", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3348762", 
abstract = "Text-to-Speech (TTS) aims to convert the input text to a human-like voice. With the development of deep learning, encoder-decoder based TTS models perform superior performance, in terms of naturalness, in mainstream languages such as Chinese, English, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jiang:2024:ERE, author = "Shu Jiang and Zuchao Li and Hai Zhao and Weiping Ding", title = "Entity-Relation Extraction as Full Shallow Semantic Dependency Parsing", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1088--1099", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3350905", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3350905", abstract = "Entity-relation extraction is the essential information extraction task and can be decomposed into Named Entity Recognition (NER) and Relation Extraction (RE) subtasks.
This paper proposes a novel joint entity-relation extraction method that models the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Vered:2024:PAD, author = "Yoav Vered and Stephen Elliott", title = "A Parallel Analog and Digital Adaptive Feedforward Controller for Active Noise Control", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1100--1108", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3350882", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3350882", abstract = "Digital adaptive controllers are widely used for feedforward active noise control, especially in headphones. In such applications, the secondary path delay, including the sampling and reconstruction effects, must be shorter than the primary path delay to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhang:2024:ISSb, author = "Puning Zhang and Rongjian Zhao and Boran Yang and Yuexian Li and Zhigang Yang", title = "Integrated Syntactic and Semantic Tree for Targeted Sentiment Classification Using Dual-Channel Graph Convolutional Network", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1109--1124", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3350877", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3350877", abstract = "Targeted sentiment analysis aims to identify the sentiment polarity of 
specific target mentions in a sentence. Existing methods employ neural networks to extract the relations between target mentions and their contexts. Recent approaches based on graph \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2024:DCC, author = "Xu Wang and Hainan Zhang and Shuai Zhao and Hongshen Chen and Zhuoye Ding and Zhiguo Wan and Bo Cheng and Yanyan Lan", title = "Debiasing Counterfactual Context With Causal Inference for Multi-Turn Dialogue Reasoning", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1125--1132", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3343608", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3343608", abstract = "In the multi-turn dialogue reasoning task, existing models conduct word-level interaction on the entire context to gather reasoning evidence, which aims to select the logically correct one from the candidate response options. 
Observing the fact that the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chau:2024:NAM, author = "Hoang Ngoc Chau and Tien Dat Bui and Huu Binh Nguyen and Thanh Thi Hien Duong and Quoc Cuong Nguyen", title = "A Novel Approach to Multi-Channel Speech Enhancement Based on Graph Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1133--1144", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3352259", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3352259", abstract = "Multi-channel speech enhancement aims at utilizing spatial relationships between signals captured from a microphone array along with temporal-spectral information efficiently to estimate the clean target. An emerging approach is to design deep learning-
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Hu:2024:WRC, author = "Yuchen Hu and Chen Chen and Qiushi Zhu and Eng Siong Chng", title = "{Wav2code}: Restore Clean Speech Representations via Codebook Lookup for Noise-Robust {ASR}", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1145--1156", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3332545", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3332545", abstract = "Automatic speech recognition (ASR) has gained remarkable successes thanks to recent advances of deep learning, but it usually degrades significantly under real-world noisy conditions. Recent works introduce speech enhancement (SE) as front-end to improve \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ueda:2024:BSR, author = "Tetsuya Ueda and Tomohiro Nakatani and Rintaro Ikeshita and Keisuke Kinoshita and Shoko Araki and Shoji Makino", title = "Blind and Spatially-Regularized Online Joint Optimization of Source Separation, Dereverberation, and Noise Reduction", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1157--1172", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3351353", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3351353", abstract = "This paper proposes a computationally efficient joint optimization algorithm that performs online 
source separation, dereverberation, and noise reduction based on blind and spatially-regularized processing. When applying such online Blind Source \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Agarwal:2024:TTG, author = "Vibhav Agarwal and Sourav Ghosh and Harichandana BSS and Himanshu Arora and Barath Raj Kandur Raja", title = "{TrICy}: Trigger-Guided Data-to-Text Generation With Intent Aware Attention-Copy", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1173--1184", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3353574", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3353574", abstract = "Data-to-text (D2T) generation is a crucial task in many natural language understanding (NLU) applications and forms the foundation of task-oriented dialog systems.
In the context of conversational AI solutions that can work directly with local data on the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Boeddeker:2024:TSJ, author = "Christoph Boeddeker and Aswin Shanmugam Subramanian and Gordon Wichern and Reinhold Haeb-Umbach and Jonathan {Le Roux}", title = "{TS-SEP}: Joint Diarization and Separation Conditioned on Estimated Speaker Embeddings", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1185--1197", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3350887", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3350887", abstract = "Since diarization and source separation of meeting data are closely related tasks, we here propose an approach to perform the two objectives jointly. 
It builds upon the target-speaker voice activity detection (TS-VAD) diarization approach, which assumes \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Varzandeh:2024:SAB, author = "Reza Varzandeh and Simon Doclo and Volker Hohmann", title = "Speech-Aware Binaural {DOA} Estimation Utilizing Periodicity and Spatial Features in Convolutional Neural Networks", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1198--1213", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3356987", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3356987", abstract = "In recent years, several supervised learning-based approaches have been proposed for estimating the direction of arrival (DOA) of a single talker in noisy and reverberant environments. 
In the absence of auxiliary information, such as a voice activity \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Ozer:2024:SSP, author = "Yigitcan {\"O}zer and Meinard M{\"u}ller", title = "Source Separation of Piano Concertos Using Musically Motivated Augmentation Techniques", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1214--1225", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3356980", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3356980", abstract = "In this work, we address the novel and rarely considered source separation task of decomposing piano concerto recordings into separate piano and orchestral tracks. Being a genre written for a pianist typically accompanied by an ensemble or orchestra, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Frenkel:2024:DAU, author = "Lior Frenkel and Shlomo E. 
Chazan and Jacob Goldberger", title = "Domain Adaptation Using Suitable Pseudo Labels for Speech Enhancement and Dereverberation", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1226--1236", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3358051", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3358051", abstract = "Speech enhancement and dereverberation approaches based on neural networks are designed to learn a transformation from noisy to clean speech using supervised learning. However, networks trained in this way may fail to effectively handle languages, types \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2024:DTR, author = "Jiahao Zhao and Wenji Mao and Daniel Dajun Zeng", title = "Disentangled Text Representation Learning With Information-Theoretic Perspective for Adversarial Robustness", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1237--1247", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3358052", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3358052", abstract = "Adversarial vulnerability remains a major obstacle to the construction of reliable NLP systems. When imperceptible perturbations are added to raw input text, the performance of a deep learning model may drop dramatically under attacks. 
Recent work has \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2024:CMI, author = "Dong Zhou and Fang Lei and Lin Li and Yongmei Zhou and Aimin Yang", title = "Cross-Modal Interaction via Reinforcement Feedback for Audio-Lyrics Retrieval", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1248--1260", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3358048", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3358048", abstract = "The task of retrieving audio content relevant to lyric queries and vice versa plays a critical role in music-oriented applications. In this process, robust feature representations have to be learned for two modalities. 
Furthermore, interactions between \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2024:GSV, author = "Xuechen Liu and Md Sahidullah and Kong Aik Lee and Tomi Kinnunen", title = "Generalizing Speaker Verification for Spoof Awareness in the Embedding Space", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1261--1273", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3358056", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3358056", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Cui:2024:EME, author = "Shiyao Cui and Jiangxia Cao and Xin Cong and Jiawei Sheng and Quangang Li and Tingwen Liu and Jinqiao Shi", title = "Enhancing Multimodal Entity and Relation Extraction With Variational Information Bottleneck", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1274--1285", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3345146", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3345146", abstract = "This article studies the multimodal named entity recognition (MNER) and multimodal relation extraction (MRE), which are important for content analysis and various applications. 
The core of MNER and MRE lies in incorporating evident visual information to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Tan:2024:ASC, author = "Yizhou Tan and Haojun Ai and Shengchen Li and Mark D. Plumbley", title = "Acoustic Scene Classification Across Cities and Devices via Feature Disentanglement", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1286--1297", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3353578", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3353578", abstract = "Acoustic Scene Classification (ASC) is a task that classifies a scene according to environmental acoustic signals. Audios collected from different cities and devices often exhibit biases in feature distributions, which may negatively impact ASC \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{BenZaken:2024:NNB, author = "Orel {Ben Zaken} and Anurag Kumar and Vladimir Tourbabin and Boaz Rafaely", title = "Neural-Network-Based Direction-of-Arrival Estimation for Reverberant Speech --- The Importance of Energetic, Temporal, and Spatial Information", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1298--1309", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3357037", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3357037", abstract = "Direction-of-arrival (DOA) estimation is a
fundamental task in audio signal processing that becomes difficult in real-world environments due to the presence of reverberation. To address this difficulty, Direct-Path Dominance (DPD) tests have been proposed \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Quan:2024:SEL, author = "Changsheng Quan and Xiaofei Li", title = "{SpatialNet}: Extensively Learning Spatial Information for Multichannel Joint Speech Separation, Denoising and Dereverberation", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1310--1323", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3357036", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3357036", abstract = "This work proposes a neural network to extensively exploit spatial information for multichannel joint speech separation, denoising and dereverberation, named SpatialNet. In the short-time Fourier transform (STFT) domain, the proposed network performs end-to-end
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Baas:2024:DGU, author = "Matthew Baas and Herman Kamper", title = "Disentanglement in a {GAN} for Unconditional Speech Synthesis", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1324--1335", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3359352", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3359352", abstract = "Can we develop a model that can synthesize realistic speech directly from a latent space, without explicit conditioning? Despite several efforts over the last decade, previous adversarial and diffusion-based approaches still struggle to achieve this, even \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Li:2024:SSA, author = "Xian Li and Nian Shao and Xiaofei Li", title = "Self-Supervised Audio Teacher-Student Transformer for Both Clip-Level and Frame-Level Tasks", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1336--1351", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3352248", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3352248", abstract = "Self-supervised learning (SSL) has emerged as a popular approach for learning audio representations. One goal of audio self-supervised pre-training is to transfer knowledge to downstream audio tasks, generally including clip-level and frame-level tasks.
\ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2024:ITC, author = "Yifan Chen and Gaofeng Cheng and Runyan Yang and Pengyuan Zhang and Yonghong Yan", title = "Interrelate Training and Clustering for Online Speaker Diarization", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1352--1364", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3357033", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3357033", abstract = "In clustering-based speaker diarization systems, the embedding clusters for distinctive speakers exhibit wide variability in size and density, posing difficulty for clustering accuracy. In spite of this, with the assistance of the overall distance \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Feng:2024:MHT, author = "Sheng Feng and Xiaoqian Zhu and Shuqing Ma", title = "Masking Hierarchical Tokens for Underwater Acoustic Target Recognition With Self-Supervised Learning", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1365--1379", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3358719", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3358719", abstract = "Deep learning has made data-driven methods effective in underwater acoustic target recognition (UATR) using passive sonar signals. 
However, a major current challenge is the limited availability of underwater acoustic data, leading to suboptimal \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhao:2024:DDN, author = "Yangyang Zhao and Kai Yin and Zhenyu Wang and Mehdi Dastani and Shihan Wang", title = "Decomposed Deep {$Q$}-Network for Coherent Task-Oriented Dialogue Policy Learning", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1380--1391", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3357038", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3357038", abstract = "Reinforcement learning (RL) has emerged as a key technique for designing dialogue policies. However, action space inflation in dialogue tasks has led to a heavy decision burden and incoherence problems for dialogue policies. 
In this paper, we propose a \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Parekh:2024:TIA, author = "Jayneel Parekh and Sanjeel Parekh and Pavlo Mozharovskyi and Ga{\"e}l Richard and Florence d'Alch{\'e}-Buc", title = "Tackling Interpretability in Audio Classification Networks With Non-negative Matrix Factorization", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1392--1405", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3358049", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3358049", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2024:WSS, author = "Xiuying Chen and Shen Gao and Mingzhe Li and Qingqing Zhu and Xin Gao and Xiangliang Zhang", title = "Write Summary Step-by-Step: a Pilot Study of Stepwise Summarization", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1406--1415", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3357040", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3357040", abstract = "Nowadays, neural text generation has made tremendous progress in abstractive summarization tasks. However, most of the existing summarization models take in the whole document all at once, which sometimes cannot meet the needs in practice. 
Practically, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Lin:2024:MIF, author = "Changkai Lin and Hongju Cheng and Qiang Rao and Yang Yang", title = "{M$^3$SA}: Multimodal Sentiment Analysis Based on Multi-Scale Feature Extraction and Multi-Task Learning", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1416--1429", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3361374", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3361374", abstract = "Sentiment analysis plays an indispensable part in human-computer interaction. Multimodal sentiment analysis can overcome the shortcomings of unimodal sentiment analysis by fusing multimodal data. 
However, how to extract improved feature representations \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zheng:2024:IUT, author = "Rui-Chen Zheng and Yang Ai and Zhen-Hua Ling", title = "Incorporating Ultrasound Tongue Images for Audio-Visual Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1430--1444", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3361376", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3361376", abstract = "Audio-visual speech enhancement (AV-SE) aims to enhance degraded speech along with extra visual information such as lip videos, and has been shown to be more effective than audio-only speech enhancement.
This paper proposes the incorporation of ultrasound \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Biswas:2024:SGN, author = "Ritujoy Biswas and Karan Nathwani and Vinayak Abrol", title = "Statistically Guided Near-End Speech Intelligibility Improvement Through Voice Transformation and Transfer Learning", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1445--1456", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3359893", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3359893", abstract = "In recent developments, speech intelligibility has been improved through an optimal trapezoidal transformation function, which performed normal to Lombard speech conversion via formant shifting. 
Despite performing well, the optimization took very long to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Sun:2024:DBM, author = "Linhui Sun and Shuo Yuan and Aifei Gong and Lei Ye and Eng Siong Chng", title = "Dual-Branch Modeling Based on State-Space Model for Speech Enhancement", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1457--1467", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3362691", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3362691", abstract = "Traditional time-frequency domain speech enhancement methods either only enhance the amplitude spectral features without changing the phase that contributes to the naturalness, intelligibility and harmonic structure, or improve the estimation of the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Koudounas:2024:TCS, author = "Alkis Koudounas and Eliana Pastor and Giuseppe Attanasio and Vittorio Mazzia and Manuel Giollo and Thomas Gueudre and Elisa Reale and Luca Cagliero and Sandro Cumani and Luca de Alfaro and Elena Baralis and Daniele Amberti", title = "Towards Comprehensive Subgroup Performance Analysis in Speech Models", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1468--1480", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3363447", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = 
"https://dl.acm.org/doi/10.1109/TASLP.2024.3363447", abstract = "The evaluation of spoken language understanding (SLU) systems is often restricted to assessing their global performance or examining predefined subgroups of interest. However, a more detailed analysis at the subgroup level has the potential to uncover \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Xiong:2024:JDE, author = "Wenmeng Xiong and Changchun Bao and Jing Zhou and Maoshen Jia and Jos{\'e} Picheral", title = "Joint {DOA} Estimation and Dereverberation Based on Multi-Channel Linear Prediction Filtering and Azimuth Sparsity", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1481--1493", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3363441", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3363441", abstract = "Source localization in reverberant environments has been a prominent research topic in the past two decades. 
In this paper, instead of the commonly employed time-frequency (TF) bin based methods which rely on empirically selected threshold values, we \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Alkaher:2024:HDG, author = "Yehav Alkaher and Israel Cohen", title = "Howling Detection and Gain Control for Speech Reinforcement in a Noisy Car Cabin Environment", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1494--1505", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3364091", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3364091", abstract = "In-car speech communication is particularly challenging due to environmental noise. The speaker's microphone also acquires car and road noises, resulting in a low signal-to-noise ratio and persistent frequency-howls that do not decrease, which \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhu:2024:MME, author = "Xinfa Zhu and Yi Lei and Tao Li and Yongmao Zhang and Hongbin Zhou and Heng Lu and Lei Xie", title = "{METTS}: Multilingual Emotional Text-to-Speech by Cross-Speaker and Cross-Lingual Emotion Transfer", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1506--1518", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3363444", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3363444", abstract = "Previous multilingual
text-to-speech (TTS) approaches have considered leveraging monolingual speaker data to enable cross-lingual speech synthesis. However, such data-efficient approaches have ignored synthesizing emotional aspects of speech due to the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jeong:2024:TLL, author = "Myeonghun Jeong and Minchan Kim and Byoung Jin Choi and Jaesam Yoon and Won Jang and Nam Soo Kim", title = "Transfer Learning for Low-Resource, Multi-Lingual, and Zero-Shot Multi-Speaker Text-to-Speech", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1519--1530", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3364085", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3364085", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Yao:2024:IST, author = "Jiadi Yao and Hong Luo and Jun Qi and Xiao-Lei Zhang", title = "Interpretable Spectrum Transformation Attacks to Speaker Recognition Systems", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1531--1545", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3364100", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3364100", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; 
http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2024:SLN, author = "Xiang Chen and Lei Li and Yuqi Zhu and Shumin Deng and Chuanqi Tan and Fei Huang and Luo Si and Ningyu Zhang and Huajun Chen", title = "Sequence Labeling as Non-Autoregressive Dual-Query Set Generation", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1546--1558", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3358053", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3358053", abstract = "Sequence labeling is a crucial task in the NLP community that aims at identifying and assigning spans within the input sentence. It has wide applications in various fields such as information extraction, dialogue system, and sentiment analysis. However, \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Liu:2024:CPE, author = "Lei Liu and Li Liu and Haizhou Li", title = "Computation and Parameter Efficient Multi-Modal Fusion Transformer for Cued Speech Recognition", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1559--1572", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3363446", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3363446", abstract = "Cued Speech (CS) is a pure visual coding method used by hearing-impaired people that combines lip reading with several specific hand shapes to make the spoken language visible. 
Automatic CS recognition (ACSR) seeks to transcribe visual cues of speech into \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Barahona-Rios:2024:NCT, author = "Adri{\'a}n Barahona-R{\'\i}os and Tom Collins", title = "{NoiseBandNet}: Controllable Time-Varying Neural Synthesis of Sound Effects Using Filterbanks", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1573--1585", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3364616", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3364616", abstract = "Controllable neural audio synthesis of sound effects is a challenging task due to the potential scarcity and spectro-temporal variance of the data. 
Differentiable digital signal processing (DDSP) synthesisers have been successfully employed to model and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Wang:2024:USR, author = "Siyuan Wang and Zhongyu Wei and Jiarong Xu and Taishan Li and Zhihao Fan", title = "Unifying Structure Reasoning and Language Pre-Training for Complex Reasoning Tasks", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1586--1595", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2023.3325973", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2023.3325973", abstract = "Recent pre-trained language models (PLMs) equipped with foundation reasoning skills have shown remarkable performance on downstream complex tasks. 
However, the significant structure reasoning skill has been rarely studied, which involves modeling implicit \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chu:2024:NDF, author = "Yijing Chu and Sipei Zhao and Feng Niu and Yongzheng Dong and Yuezhe Zhao", title = "A New Diffusion Filtered-{$X$} Affine Projection Algorithm: Performance Analysis and Application in Windy Environment", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1596--1608", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3363409", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3363409", abstract = "Wind noise caused by turbulent flows over microphones usually has detrimental impacts on the reference signal of an active noise control (ANC) system and degrade its performance considerably. 
This paper evaluates the influence of wind noise on the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Le:2024:IFT, author = "Yuquan Le and Zhe Quan and Jiawei Wang and Da Cao and Kenli Li", title = "{$ R^2 $}: a Novel Recall \& Ranking Framework for Legal Judgment Prediction", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1609--1622", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3365389", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3365389", abstract = "The legal judgment prediction (LJP) task is to automatically decide appropriate law articles, charges, and term of penalty for giving the fact description of a law case. It considerably influences many real legal applications and has thus attracted the \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Jiang:2024:CDA, author = "Xiaotong Jiang and Ruirui Bai and Zhongqing Wang and Guodong Zhou", title = "Cross-Domain Aspect-Based Sentiment Classification With Tripartite Graph Modeling", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1623--1635", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3365975", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3365975", abstract = "Previous studies on cross-domain aspect-based sentiment classification depend on the pivot features or utilize the target data for 
representation learning, which ignores the correlations between instances and words. In this study, we employ two strategies \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Chen:2024:ABE, author = "Zhengyang Chen and Bing Han and Shuai Wang and Yanmin Qian", title = "Attention-Based Encoder-Decoder End-to-End Neural Diarization With Embedding Enhancer", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1636--1649", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3366756", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3366756", abstract = "Deep neural network-based systems have significantly improved the performance of speaker diarization tasks. 
However, end-to-end neural diarization (EEND) systems often struggle to generalize to scenarios with an unseen number of speakers, while target \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Miao:2024:EVE, author = "Chenfeng Miao and Qingying Zhu and Minchuan Chen and Jun Ma and Shaojun Wang and Jing Xiao", title = "{EfficientTTS 2}: Variational End-to-End Text-to-Speech Synthesis and Voice Conversion", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1650--1661", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3369528", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3369528", abstract = "Recently, the field of Text-to-Speech (TTS) has been dominated by one-stage text-to-waveform models which have significantly improved speech quality compared to two-stage models. 
In this work, we propose EfficientTTS 2 (EFTS2), a one-stage high-quality \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Peretz:2024:CEB, author = "Orel Peretz and Israel Cohen", title = "Constant Elevation-Beamwidth Beamforming With Concentric Ring Arrays", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1662--1672", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3365390", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3365390", abstract = "A hybrid approach is proposed to efficiently design a constant elevation-beamwidth beamforming with concentric ring arrays (CRAs). The design exploits the degrees of freedom of the array geometry for superior performance. 
In particular, the ring radii and \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Quan:2024:MMA, author = "Zhibin Quan and Chi-Man Vong and Weili Zeng and Wankou Yang", title = "The {MorPhEMe} Machine: an Addressable Neural Memory for Learning Knowledge-Regularized Deep Contextualized {Chinese} Embedding", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1673--1686", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3364610", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3364610", abstract = "Deep contextualized embeddings, as learned by large pre-training models, have proven highly effective in various downstream natural language processing tasks. 
However, the embedding space in these large models lacks explicit regularization, leading to \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Gao:2024:LTE, author = "Lijian Gao and Qirong Mao and Ming Dong", title = "On Local Temporal Embedding for Semi-Supervised Sound Event Detection", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1687--1698", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3369529", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3369529", abstract = "Semi-supervised sound event detection (SSED) task requires recognizing the categories of events and marking each event's onset and offset times in a mixed audio recording using a small amount of weakly labeled and a large scale of unlabeled data. \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Zhou:2024:ATS, author = "Xuehao Zhou and Mingyang Zhang and Yi Zhou and Zhizheng Wu and Haizhou Li", title = "Accented Text-to-Speech Synthesis With Limited Data", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1699--1711", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3363414", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3363414", abstract = "This paper presents an accented text-to-speech (TTS) synthesis framework with limited training data.
We study two aspects concerning accent rendering: phonetic (phoneme difference) and prosodic (pitch pattern and phoneme duration) variations. The proposed \ldots{}", acknowledgement = ack-nhfb, fjournal = "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing", journal-URL = "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655", } @Article{Kothapally:2024:MSD, author = "Vinay Kothapally and John H. L. Hansen", title = "Monaural Speech Dereverberation Using Deformable Convolutional Networks", journal = j-IEEE-ACM-TASLP, volume = "32", number = "??", pages = "1712--1723", year = "2024", DOI = "https://doi.org/10.1109/TASLP.2024.3358720", ISSN = "2329-9290", bibdate = "Fri Apr 12 09:07:41 MDT 2024", bibsource = "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib", URL = "https://dl.acm.org/doi/10.1109/TASLP.2024.3358720", abstract = "Reverberation and background noise can degrade speech quality and intelligibility when captured by a distant microphone. 
In recent years, researchers have developed several deep learning (DL)-based single-channel speech dereverberation systems that aim to \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2024:MLP,
  author =       "Taihui Wang and Feiran Yang and Jun Yang",
  title =        "Multichannel Linear Prediction-Based Speech Dereverberation Considering Sparse and Low-Rank Priors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1724--1735",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3369535",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3369535",
  abstract =     "This article addresses the multi-channel linear prediction (MCLP)-based speech dereverberation problem by jointly considering the sparsity and low-rank priors of speech spectrograms.
We utilize the complex generalized Gaussian (CGG) distribution as the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Kataria:2024:TDS,
  author =       "Saurabh Kataria and Jes{\'u}s Villalba and Laureano Moro-Vel{\'a}zquez and Piotr {\.Z}elasko and Najim Dehak",
  title =        "Time-Domain Speech Super-Resolution With {GAN} Based Modeling for Telephony Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1736--1749",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3369536",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3369536",
  abstract =     "Automatic Speaker Verification (ASV) technology has become commonplace in virtual assistants. However, its performance suffers when there is a mismatch between the train and test domains.
Mixed bandwidth training, i.e., pooling training data from both \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Olivieri:2024:AIC,
  author =       "Marco Olivieri and Amy Bastine and Mirco Pezzoli and Fabio Antonacci and Thushara Abhayapala and Augusto Sarti",
  title =        "Acoustic Imaging With Circular Microphone Array: a New Approach for Sound Field Analysis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1750--1761",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3369533",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3369533",
  abstract =     "Acoustic imaging is powerful in collecting spatial information of acoustic sources into a visual representation. In this paper, we focus on the analysis of the exterior acoustic field captured by a circular array of microphones.
With a proper \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Liu:2024:HMG,
  author =       "Tengfei Liu and Yongli Hu and Junbin Gao and Yanfeng Sun and Baocai Yin",
  title =        "Hierarchical Multi-Granularity Interaction Graph Convolutional Network for Long Document Classification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1762--1775",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3369530",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3369530",
  abstract =     "With the growing demand for text analytics, long document classification (LDC) has received extensive attention, and great progress has been made. To reveal the complex structure and extract the intrinsic feature, the current approaches focus on modeling \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{OShaughnessy:2024:RMA,
  author =       "Douglas O'Shaughnessy",
  title =        "Review of Methods for Automatic Speaker Verification",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1776--1789",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2023.3346293",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2023.3346293",
  abstract =     "A review of techniques to identify speakers from their voices is presented, noting strengths and weaknesses of various methods.
Similar acoustic analysis has been often used for both speech and speaker recognition, despite the two tasks being quite \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Thuillier:2024:HIU,
  author =       "Etienne Thuillier and Craig T. Jin and Vesa V{\"a}lim{\"a}ki",
  title =        "{HRTF} Interpolation Using a Spherical Neural Process Meta-Learner",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1790--1802",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3361377",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3361377",
  abstract =     "Several individualization methods have recently been proposed to estimate a subject's Head-Related Transfer Function (HRTF) using convenient input modalities such as anthropometric measurements or pinnae photographs.
There exists a need for \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Gong:2024:ALC,
  author =       "Xun Gong and Yu Wu and Jinyu Li and Shujie Liu and Rui Zhao and Xie Chen and Yanmin Qian",
  title =        "Advanced Long-Content Speech Recognition With Factorized Neural Transducer",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1803--1815",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3350893",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3350893",
  abstract =     "Long-content automatic speech recognition (ASR) has obtained increasing interest in recent years, as it captures the relationship among consecutive historical utterances while decoding the current utterance. In this paper, we propose two novel approaches, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Masuyama:2024:EJO,
  author =       "Yoshiki Masuyama and Kouei Yamaoka and Takao Kawamura and Nobutaka Ono",
  title =        "Efficient Joint Optimization of Sampling Rate Offsets Using Entire Multichannel Signal",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1816--1828",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3369532",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3369532",
  abstract =     "In this paper, we propose a joint estimation method for the sampling rate offsets (SROs) of multiple recording devices.
In wireless acoustic sensor networks, distributed microphones are connected to different analog-to-digital converters, and thus SROs \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Saeki:2024:TIG,
  author =       "Takaaki Saeki and Soumi Maiti and Xinjian Li and Shinji Watanabe and Shinnosuke Takamichi and Hiroshi Saruwatari",
  title =        "Text-Inductive Graphone-Based Language Adaptation for Low-Resource Speech Synthesis",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1829--1844",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3369537",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3369537",
  abstract =     "Neural text-to-speech (TTS) systems have made significant progress in generating natural synthetic speech. However, neural TTS requires large amounts of paired training data, which limits its applicability to a small number of resource-rich languages.
\ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Gao:2024:ACS,
  author =       "Yingming Gao and Peter Birkholz and Ya Li",
  title =        "Articulatory Copy Synthesis Based on the Speech Synthesizer {VocalTractLab} and Convolutional Recurrent Neural Networks",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1845--1858",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3372874",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3372874",
  abstract =     "Articulatory copy synthesis (ACS) refers to the synthetic reproduction of natural utterances. The existing methods of ACS have the limitations of poor generalizability for unknown speakers, high computing costs, the lack of systematic evaluation, etc. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Mariotte:2024:CCA,
  author =       "Th{\'e}o Mariotte and Anthony Larcher and Silvio Montr{\'e}sor and Jean-Hugh Thomas",
  title =        "Channel-Combination Algorithms for Robust Distant Voice Activity and Overlapped Speech Detection",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1859--1872",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3369531",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3369531",
  abstract =     "Voice Activity Detection (VAD) and Overlapped Speech Detection (OSD) are key pre-processing tasks for speaker diarization.
In the meeting context, it is often easier to capture speech with a distant device. This consideration however leads to severe \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{deSouza:2024:EBM,
  author =       "Luciana M. X. de Souza and M{\'a}rcio H. Costa and Renata Coelho Borges",
  title =        "Envelope-Based Multichannel Noise Reduction for Cochlear Implant Applications",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1873--1884",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3372891",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3372891",
  abstract =     "Cochlear implants (CI) are implantable electronic prostheses that aim to restore communication in people with severe to profound hearing loss.
This is achieved by transforming the acoustic signals into electrical stimuli and applying them directly to the \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Li:2024:UDL,
  author =       "Linjian Li and Yi Cai and Xin Wu",
  title =        "Unsupervised Disentanglement Learning Model for Exemplar-Guided Paraphrase Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1885--1900",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3374124",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3374124",
  abstract =     "Exemplar-guided paraphrase generation is the task of generating a paraphrase for a source sentence when given another exemplar sentence as syntactic guidance information. The target sentence must convey the semantics of the source sentence in surface form, \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Ivry:2024:UCA,
  author =       "Amir Ivry and Israel Cohen and Baruch Berdugo",
  title =        "A User-Centric Approach for Deep Residual-Echo Suppression in Double-Talk",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1901--1914",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3374064",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3374064",
  abstract =     "We introduce a user-centric residual-echo suppression (URES) framework in double-talk.
This framework receives a user operating point (UOP) that consists of two metric values: the residual echo suppression level (RESL) and the desired speech-maintained \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Zhang:2024:QDR,
  author =       "Geng Zhang and Jin Liu and Guangyou Zhou and Kunsong Zhao and Zhiwen Xie and Bo Huang",
  title =        "Question-Directed Reasoning With Relation-Aware Graph Attention Network for Complex Question Answering Over Knowledge Graph",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1915--1927",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3375631",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3375631",
  abstract =     "Complex knowledge graph question answering (KGQA) aims at answering natural language questions by entities retrieving from a knowledge graph (KG). Recently, the relation path-based models have shown the unique advantage for complex KGQA.
However, these \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Yao:2024:KLD,
  author =       "Yu Yao and Peng Yang and Guangzhen Zhao and Guoshun Yin",
  title =        "{KGAgent}: Learning a Deep Reinforced Agent for Keyphrase Generation",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1928--1940",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3375630",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3375630",
  abstract =     "Keyphrase generation (KG) is an essential problem in many natural language processing (NLP) tasks. Deep learning keyphrase generation methods often combine the copy and generating action-aware probabilities to model keyphrase accuracy, ignoring the copy \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Li:2024:UCM,
  author =       "Jiahong Li and Chenda Li and Yifei Wu and Yanmin Qian",
  title =        "Unified Cross-Modal Attention: Robust Audio-Visual Speech Recognition and Beyond",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1941--1953",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3375641",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3375641",
  abstract =     "Audio-Visual Speech Recognition (AVSR) is a promising approach to improving the accuracy and robustness of speech recognition systems with the assistance of visual cues in challenging acoustic environments.
In this paper, we present a novel audio-visual \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Fras:2024:RSS,
  author =       "Mieszko Fra{\'s} and Konrad Kowalczyk",
  title =        "Reverberant Source Separation Using {NTF} With Delayed Subsources and Spatial Priors",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1954--1967",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3374065",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3374065",
  abstract =     "Speech signals recorded by distant microphones are often contaminated with room reverberation and signals of interfering speakers. This article addresses the problem of joint source separation and dereverberation using multichannel nonnegative tensor \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

@Article{Wang:2024:DCT,
  author =       "Rui Wang and Li Li and Tomoki Toda",
  title =        "Dual-Channel Target Speaker Extraction Based on Conditional Variational Autoencoder and Directional Information",
  journal =      j-IEEE-ACM-TASLP,
  volume =       "32",
  number =       "??",
  pages =        "1968--1979",
  year =         "2024",
  DOI =          "https://doi.org/10.1109/TASLP.2024.3376154",
  ISSN =         "2329-9290",
  bibdate =      "Fri Apr 12 09:07:41 MDT 2024",
  bibsource =    "https://www.math.utah.edu/pub/tex/bib/ieeeacmtaslp.bib",
  URL =          "https://dl.acm.org/doi/10.1109/TASLP.2024.3376154",
  abstract =     "Target speaker extraction (TSE) has become an attractive research topic in recent years. However, TSE under the underdetermined conditions is still a challenge. In this paper, we deal with a dual-channel TSE problem under underdetermined conditions. \ldots{}",
  acknowledgement = ack-nhfb,
  fjournal =     "IEEE\slash ACM Transactions on Audio, Speech, and Language Processing",
  journal-URL =  "https://dl.acm.org/loi/taslp; http://ieeexplore.ieee.org/xpl/RecentIssue.jsp?punumber=6570655",
}

%%% [27-May-2021] TO DO: ACM has only 30 articles in volume 28, but IEEE shows 180!
%%% [07-Apr-2022] v30 is incomplete (full year coverage)
%%% [17-May-2023] Check contents for most recent volume: additions are made during the year; also fix bibsource data