BibTeX records: Hiroshi Saruwatari

download as .bib file

% IEEE Access article on the JVNV corpus. "Japanese" is braced so sentence-casing styles keep its capital.
@article{DBLP:journals/access/XinJTSAS24,
  author     = {Xin, Detai and
                Jiang, Junfeng and
                Takamichi, Shinnosuke and
                Saito, Yuki and
                Aizawa, Akiko and
                Saruwatari, Hiroshi},
  title      = {{JVNV:} {A} Corpus of {Japanese} Emotional Speech With Verbal Content
                and Nonverbal Expressions},
  year       = {2024},
  journal    = {{IEEE} Access},
  volume     = {12},
  pages      = {19752--19764},
  doi        = {10.1109/ACCESS.2024.3360885},
  url        = {https://doi.org/10.1109/ACCESS.2024.3360885},
  timestamp  = {Sat, 16 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/access/XinJTSAS24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article on the JNV corpus. "Japanese" is braced so sentence-casing styles keep its capital.
% Same author list and (case aside) same title as DBLP:journals/corr/abs-2305-12445 -- presumably its preprint; TODO confirm.
@article{DBLP:journals/speech/XinTS24,
  author     = {Xin, Detai and
                Takamichi, Shinnosuke and
                Saruwatari, Hiroshi},
  title      = {{JNV} corpus: {A} corpus of {Japanese} nonverbal vocalizations with
                diverse phrases and emotions},
  year       = {2024},
  journal    = {Speech Commun.},
  volume     = {156},
  pages      = {103004},
  doi        = {10.1016/J.SPECOM.2023.103004},
  url        = {https://doi.org/10.1016/j.specom.2023.103004},
  timestamp  = {Fri, 08 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/speech/XinTS24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (2024, volume 32) on graphone-based language adaptation for low-resource speech synthesis.
@article{DBLP:journals/taslp/SaekiMLWTS24,
  author     = {Saeki, Takaaki and
                Maiti, Soumi and
                Li, Xinjian and
                Watanabe, Shinji and
                Takamichi, Shinnosuke and
                Saruwatari, Hiroshi},
  title      = {Text-Inductive Graphone-Based Language Adaptation
                for Low-Resource Speech Synthesis},
  year       = {2024},
  journal    = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume     = {32},
  pages      = {1829--1844},
  doi        = {10.1109/TASLP.2024.3369537},
  url        = {https://doi.org/10.1109/TASLP.2024.3369537},
  timestamp  = {Mon, 01 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/taslp/SaekiMLWTS24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2401.05809, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2401-05809,
  author     = {Tomita, Yoshihide and
                Koyama, Shoichi and
                Saruwatari, Hiroshi},
  title      = {Localizing Acoustic Energy in Sound Field Synthesis
                by Directionally Weighted Exterior Radiation Suppression},
  year       = {2024},
  journal    = {CoRR},
  volume     = {abs/2401.05809},
  doi        = {10.48550/ARXIV.2401.05809},
  url        = {https://doi.org/10.48550/arXiv.2401.05809},
  eprinttype = {arXiv},
  eprint     = {2401.05809},
  timestamp  = {Fri, 26 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-05809.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2401.16812 (CoRR record). The coined name "SpeechBERTScore" is braced so
% sentence-casing styles do not flatten it; the colon stays outside the braces so the word after it keeps its capital.
@article{DBLP:journals/corr/abs-2401-16812,
  author     = {Saeki, Takaaki and
                Maiti, Soumi and
                Takamichi, Shinnosuke and
                Watanabe, Shinji and
                Saruwatari, Hiroshi},
  title      = {{SpeechBERTScore}: Reference-Aware Automatic Evaluation of Speech Generation
                Leveraging {NLP} Evaluation Metrics},
  year       = {2024},
  journal    = {CoRR},
  volume     = {abs/2401.16812},
  doi        = {10.48550/ARXIV.2401.16812},
  url        = {https://doi.org/10.48550/arXiv.2401.16812},
  eprinttype = {arXiv},
  eprint     = {2401.16812},
  timestamp  = {Tue, 06 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-16812.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2403.12477, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2403-12477,
  author     = {Ishikawa, Yuto and
                Konaka, Kohei and
                Nakamura, Tomohiko and
                Takamune, Norihiro and
                Saruwatari, Hiroshi},
  title      = {Real-time Speech Extraction Using Spatially Regularized
                Independent Low-rank Matrix Analysis and
                Rank-constrained Spatial Covariance Matrix Estimation},
  year       = {2024},
  journal    = {CoRR},
  volume     = {abs/2403.12477},
  doi        = {10.48550/ARXIV.2403.12477},
  url        = {https://doi.org/10.48550/arXiv.2403.12477},
  eprinttype = {arXiv},
  eprint     = {2403.12477},
  timestamp  = {Mon, 08 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-12477.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2403.13353, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2403-13353,
  author     = {Watanabe, Aya and
                Takamichi, Shinnosuke and
                Saito, Yuki and
                Nakata, Wataru and
                Xin, Detai and
                Saruwatari, Hiroshi},
  title      = {Building speech corpus with diverse voice characteristics
                for its prompt-based representation},
  year       = {2024},
  journal    = {CoRR},
  volume     = {abs/2403.13353},
  doi        = {10.48550/ARXIV.2403.13353},
  url        = {https://doi.org/10.48550/arXiv.2403.13353},
  eprinttype = {arXiv},
  eprint     = {2403.13353},
  timestamp  = {Mon, 08 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-13353.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IEEE Access article. The coined name "SelfRemaster" is braced so sentence-casing styles keep its inner capital;
% the colon stays outside the braces so the word after it keeps its capital.
@article{DBLP:journals/access/SaekiTNTS23,
  author     = {Saeki, Takaaki and
                Takamichi, Shinnosuke and
                Nakamura, Tomohiko and
                Tanji, Naoko and
                Saruwatari, Hiroshi},
  title      = {{SelfRemaster}: Self-Supervised Speech Restoration for Historical Audio
                Resources},
  year       = {2023},
  journal    = {{IEEE} Access},
  volume     = {11},
  pages      = {144831--144843},
  doi        = {10.1109/ACCESS.2023.3345027},
  url        = {https://doi.org/10.1109/ACCESS.2023.3345027},
  timestamp  = {Sat, 13 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/access/SaekiTNTS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (2023, volume 31) on amplitude matching for multizone sound field control.
@article{DBLP:journals/taslp/AbeKUS23,
  author     = {Abe, Takumi and
                Koyama, Shoichi and
                Ueno, Natsuki and
                Saruwatari, Hiroshi},
  title      = {Amplitude Matching for Multizone Sound Field Control},
  year       = {2023},
  journal    = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume     = {31},
  pages      = {656--669},
  doi        = {10.1109/TASLP.2022.3231715},
  url        = {https://doi.org/10.1109/TASLP.2022.3231715},
  timestamp  = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/taslp/AbeKUS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (2023, volume 31). The acronym "PoP-IDLMA" is braced so sentence-casing styles do not lowercase it;
% the colon stays outside the braces so the word after it keeps its capital.
@article{DBLP:journals/taslp/HasumiNTSKTK23,
  author     = {Hasumi, Takuya and
                Nakamura, Tomohiko and
                Takamune, Norihiro and
                Saruwatari, Hiroshi and
                Kitamura, Daichi and
                Takahashi, Yu and
                Kondo, Kazunobu},
  title      = {{PoP-IDLMA}: Product-of-Prior Independent Deeply Learned Matrix Analysis
                for Multichannel Music Source Separation},
  year       = {2023},
  journal    = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume     = {31},
  pages      = {2680--2694},
  doi        = {10.1109/TASLP.2023.3293044},
  url        = {https://doi.org/10.1109/TASLP.2023.3293044},
  timestamp  = {Tue, 12 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/taslp/HasumiNTSKTK23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% APSIPA ASC 2023 conference paper on ILRMA with spectrogram-consistency regularization.
@inproceedings{DBLP:conf/apsipa/MisawaTYKS23,
  author     = {Misawa, Sota and
                Takamune, Norihiro and
                Yatabe, Kohei and
                Kitamura, Daichi and
                Saruwatari, Hiroshi},
  title      = {Blind Source Separation Using Independent Low-Rank Matrix Analysis
                with Spectrogram-Consistency Regularization},
  year       = {2023},
  booktitle  = {Asia Pacific Signal and Information Processing Association Annual
                Summit and Conference, {APSIPA} {ASC} 2023, Taipei, Taiwan, October
                31 - Nov. 3, 2023},
  pages      = {1050--1057},
  publisher  = {{IEEE}},
  doi        = {10.1109/APSIPAASC58517.2023.10317156},
  url        = {https://doi.org/10.1109/APSIPAASC58517.2023.10317156},
  timestamp  = {Sat, 02 Dec 2023 14:05:45 +0100},
  biburl     = {https://dblp.org/rec/conf/apsipa/MisawaTYKS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ASRU 2023 workshop paper on the COCO-NUT corpus. "Japanese" is braced so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/asru/WatanabeTSNXS23,
  author     = {Watanabe, Aya and
                Takamichi, Shinnosuke and
                Saito, Yuki and
                Nakata, Wataru and
                Xin, Detai and
                Saruwatari, Hiroshi},
  title      = {{COCO-NUT:} Corpus of {Japanese} Utterance and Voice Characteristics
                Description for Prompt-Based Control},
  year       = {2023},
  booktitle  = {{IEEE} Automatic Speech Recognition and Understanding Workshop, {ASRU}
                2023, Taipei, Taiwan, December 16-20, 2023},
  pages      = {1--8},
  publisher  = {{IEEE}},
  doi        = {10.1109/ASRU57964.2023.10389693},
  url        = {https://doi.org/10.1109/ASRU57964.2023.10389693},
  timestamp  = {Tue, 13 Feb 2024 21:21:14 +0100},
  biburl     = {https://dblp.org/rec/conf/asru/WatanabeTSNXS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EUSIPCO 2023 conference paper. "Riemannian" is braced so sentence-casing styles keep its capital.
% Same title and author list as DBLP:journals/corr/abs-2306-08855 -- presumably its preprint; TODO confirm.
@inproceedings{DBLP:conf/eusipco/KojimaAKS23,
  author     = {Kojima, Takaaki and
                Arikawa, Kazuyuki and
                Koyama, Shoichi and
                Saruwatari, Hiroshi},
  title      = {Multichannel Active Noise Control with Exterior Radiation Suppression
                Based on {Riemannian} Optimization},
  year       = {2023},
  booktitle  = {31st European Signal Processing Conference, {EUSIPCO} 2023, Helsinki,
                Finland, September 4-8, 2023},
  pages      = {96--100},
  publisher  = {{IEEE}},
  doi        = {10.23919/EUSIPCO58844.2023.10289919},
  url        = {https://doi.org/10.23919/EUSIPCO58844.2023.10289919},
  timestamp  = {Mon, 06 Nov 2023 12:35:15 +0100},
  biburl     = {https://dblp.org/rec/conf/eusipco/KojimaAKS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EUSIPCO 2023 conference paper.
% Same title and author list as DBLP:journals/corr/abs-2306-10718 -- presumably its preprint; TODO confirm.
@inproceedings{DBLP:conf/eusipco/ImamuraNTYS23,
  author     = {Imamura, Kanami and
                Nakamura, Tomohiko and
                Takamune, Norihiro and
                Yatabe, Kohei and
                Saruwatari, Hiroshi},
  title      = {Algorithms of Sampling-Frequency-Independent Layers
                for Non-integer Strides},
  year       = {2023},
  booktitle  = {31st European Signal Processing Conference, {EUSIPCO} 2023, Helsinki,
                Finland, September 4-8, 2023},
  pages      = {326--330},
  publisher  = {{IEEE}},
  doi        = {10.23919/EUSIPCO58844.2023.10289819},
  url        = {https://doi.org/10.23919/EUSIPCO58844.2023.10289819},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/eusipco/ImamuraNTYS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EUSIPCO 2023 conference paper. The coined name "NoisyILRMA" is braced so sentence-casing styles do not lowercase
% the acronym part; the colon stays outside the braces so the word after it keeps its capital.
% Same title and author list as DBLP:journals/corr/abs-2306-12820 -- presumably its preprint; TODO confirm.
@inproceedings{DBLP:conf/eusipco/NishidaTIKSN23,
  author     = {Nishida, Koki and
                Takamune, Norihiro and
                Ikeshita, Rintaro and
                Kitamura, Daichi and
                Saruwatari, Hiroshi and
                Nakatani, Tomohiro},
  title      = {{NoisyILRMA}: Diffuse-Noise-Aware Independent Low-Rank Matrix Analysis
                for Fast Blind Source Extraction},
  year       = {2023},
  booktitle  = {31st European Signal Processing Conference, {EUSIPCO} 2023, Helsinki,
                Finland, September 4-8, 2023},
  pages      = {925--929},
  publisher  = {{IEEE}},
  doi        = {10.23919/EUSIPCO58844.2023.10289863},
  url        = {https://doi.org/10.23919/EUSIPCO58844.2023.10289863},
  timestamp  = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/eusipco/NishidaTIKSN23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2023 conference paper.
% Same author list and (case aside) same title as DBLP:journals/corr/abs-2303-16021 -- presumably its preprint; TODO confirm.
@inproceedings{DBLP:conf/icassp/ArikawaKS23,
  author     = {Arikawa, Kazuyuki and
                Koyama, Shoichi and
                Saruwatari, Hiroshi},
  title      = {Spatial Active Noise Control Method Based on Sound Field
                Interpolation from Reference Microphone Signals},
  year       = {2023},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing
                {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages      = {1--5},
  publisher  = {{IEEE}},
  doi        = {10.1109/ICASSP49357.2023.10097189},
  url        = {https://doi.org/10.1109/ICASSP49357.2023.10097189},
  timestamp  = {Sun, 05 Nov 2023 16:51:21 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/ArikawaKS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2023 conference paper on the jaCappella corpus. "jaCappella" and "Japanese" are braced so
% sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/icassp/NakamuraTTFS23,
  author     = {Nakamura, Tomohiko and
                Takamichi, Shinnosuke and
                Tanji, Naoko and
                Fukayama, Satoru and
                Saruwatari, Hiroshi},
  title      = {{jaCappella} Corpus: {A} {Japanese} a Cappella Vocal Ensemble Corpus},
  year       = {2023},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing
                {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages      = {1--5},
  publisher  = {{IEEE}},
  doi        = {10.1109/ICASSP49357.2023.10095569},
  url        = {https://doi.org/10.1109/ICASSP49357.2023.10095569},
  timestamp  = {Fri, 10 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/NakamuraTTFS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2023 conference paper on environmental sound synthesis from visual onomatopoeias.
@inproceedings{DBLP:conf/icassp/OhnakaTIOFS23,
  author     = {Ohnaka, Hien and
                Takamichi, Shinnosuke and
                Imoto, Keisuke and
                Okamoto, Yuki and
                Fujii, Kazuki and
                Saruwatari, Hiroshi},
  title      = {Visual Onoma-to-Wave: Environmental Sound Synthesis
                from Visual Onomatopoeias and Sound-Source Images},
  year       = {2023},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing
                {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages      = {1--5},
  publisher  = {{IEEE}},
  doi        = {10.1109/ICASSP49357.2023.10096517},
  url        = {https://doi.org/10.1109/ICASSP49357.2023.10096517},
  timestamp  = {Sun, 05 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/OhnakaTIOFS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2023 conference paper.
% Same author list and (case aside) same title as DBLP:journals/corr/abs-2303-03869 -- presumably its preprint; TODO confirm.
@inproceedings{DBLP:conf/icassp/RibeiroKS23,
  author     = {Ribeiro, Juliano G. C. and
                Koyama, Shoichi and
                Saruwatari, Hiroshi},
  title      = {Kernel Interpolation of Acoustic Transfer Functions
                with Adaptive Kernel for Directed and Residual Reverberations},
  year       = {2023},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing
                {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages      = {1--5},
  publisher  = {{IEEE}},
  doi        = {10.1109/ICASSP49357.2023.10095429},
  url        = {https://doi.org/10.1109/ICASSP49357.2023.10095429},
  timestamp  = {Sun, 05 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/RibeiroKS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2023 conference paper. "Gaussian" is braced so sentence-casing styles keep its capital.
% NOTE(review): "MID-Attribute" is left unbraced on purpose; its all-caps form looks like an export artefact -- confirm.
@inproceedings{DBLP:conf/icassp/WatanabeTSXS23,
  author     = {Watanabe, Aya and
                Takamichi, Shinnosuke and
                Saito, Yuki and
                Xin, Detai and
                Saruwatari, Hiroshi},
  title      = {MID-Attribute Speaker Generation Using Optimal-Transport-Based Interpolation
                of {Gaussian} Mixture Models},
  year       = {2023},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing
                {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages      = {1--5},
  publisher  = {{IEEE}},
  doi        = {10.1109/ICASSP49357.2023.10097113},
  url        = {https://doi.org/10.1109/ICASSP49357.2023.10097113},
  timestamp  = {Sun, 05 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/WatanabeTSXS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2023 conference paper on prosody of audiobook text-to-speech synthesis.
@inproceedings{DBLP:conf/icassp/XinAAKTS23,
  author     = {Xin, Detai and
                Adavanne, Sharath and
                Ang, Federico and
                Kulkarni, Ashish and
                Takamichi, Shinnosuke and
                Saruwatari, Hiroshi},
  title      = {Improving Speech Prosody of Audiobook Text-To-Speech Synthesis
                with Acoustic and Textual Contexts},
  year       = {2023},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing
                {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages      = {1--5},
  publisher  = {{IEEE}},
  doi        = {10.1109/ICASSP49357.2023.10096247},
  url        = {https://doi.org/10.1109/ICASSP49357.2023.10096247},
  timestamp  = {Sun, 05 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/XinAAKTS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2023 conference paper.
% Same author list and (case aside) same title as DBLP:journals/corr/abs-2302-13652 -- presumably its preprint; TODO confirm.
@inproceedings{DBLP:conf/icassp/YangKSSXS23,
  author     = {Yang, Dong and
                Koriyama, Tomoki and
                Saito, Yuki and
                Saeki, Takaaki and
                Xin, Detai and
                Saruwatari, Hiroshi},
  title      = {Duration-Aware Pause Insertion Using Pre-Trained Language Model
                for Multi-Speaker Text-To-Speech},
  year       = {2023},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing
                {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages      = {1--5},
  publisher  = {{IEEE}},
  doi        = {10.1109/ICASSP49357.2023.10096402},
  url        = {https://doi.org/10.1109/ICASSP49357.2023.10096402},
  timestamp  = {Sun, 05 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/YangKSSXS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IJCAI 2023 conference paper.
% Same title and author list as DBLP:journals/corr/abs-2301-12596 -- presumably its preprint; TODO confirm.
@inproceedings{DBLP:conf/ijcai/SaekiML0TS23,
  author     = {Saeki, Takaaki and
                Maiti, Soumi and
                Li, Xinjian and
                Watanabe, Shinji and
                Takamichi, Shinnosuke and
                Saruwatari, Hiroshi},
  title      = {Learning to Speak from Text: Zero-Shot Multilingual
                Text-to-Speech with Unsupervised Text Pretraining},
  year       = {2023},
  booktitle  = {Proceedings of the Thirty-Second International Joint Conference on
                Artificial Intelligence, {IJCAI} 2023, 19th-25th August 2023, Macao,
                SAR, China},
  pages      = {5179--5187},
  publisher  = {ijcai.org},
  doi        = {10.24963/IJCAI.2023/575},
  url        = {https://doi.org/10.24963/ijcai.2023/575},
  timestamp  = {Mon, 28 Aug 2023 17:23:07 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/SaekiML0TS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% WASPAA 2023 workshop paper.
% Same title and author list as DBLP:journals/corr/abs-2307-13941 -- presumably its preprint; TODO confirm.
@inproceedings{DBLP:conf/waspaa/KimuraKS23,
  author     = {Kimura, Keisuke and
                Koyama, Shoichi and
                Saruwatari, Hiroshi},
  title      = {Perceptual Quality Enhancement of Sound Field Synthesis
                Based on Combination of Pressure and Amplitude Matching},
  year       = {2023},
  booktitle  = {{IEEE} Workshop on Applications of Signal Processing to Audio and
                Acoustics, {WASPAA} 2023, New Paltz, NY, USA, October 22-25, 2023},
  pages      = {1--5},
  publisher  = {{IEEE}},
  doi        = {10.1109/WASPAA58266.2023.10248106},
  url        = {https://doi.org/10.1109/WASPAA58266.2023.10248106},
  timestamp  = {Sat, 23 Sep 2023 11:31:10 +0200},
  biburl     = {https://dblp.org/rec/conf/waspaa/KimuraKS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% WASPAA 2023 workshop paper.
% Same title and author list as DBLP:journals/corr/abs-2309-05634 -- presumably its preprint; TODO confirm.
@inproceedings{DBLP:conf/waspaa/KoyamaNRS23,
  author     = {Koyama, Shoichi and
                Nakada, Masaki and
                Ribeiro, Juliano G. C. and
                Saruwatari, Hiroshi},
  title      = {Kernel Interpolation of Incident Sound Field
                in Region Including Scattering Objects},
  year       = {2023},
  booktitle  = {{IEEE} Workshop on Applications of Signal Processing to Audio and
                Acoustics, {WASPAA} 2023, New Paltz, NY, USA, October 22-25, 2023},
  pages      = {1--5},
  publisher  = {{IEEE}},
  doi        = {10.1109/WASPAA58266.2023.10248156},
  url        = {https://doi.org/10.1109/WASPAA58266.2023.10248156},
  timestamp  = {Sat, 23 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/waspaa/KoyamaNRS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2301.12596 (CoRR record).
% Same title and author list as DBLP:conf/ijcai/SaekiML0TS23 -- presumably the published version; TODO confirm.
@article{DBLP:journals/corr/abs-2301-12596,
  author     = {Saeki, Takaaki and
                Maiti, Soumi and
                Li, Xinjian and
                Watanabe, Shinji and
                Takamichi, Shinnosuke and
                Saruwatari, Hiroshi},
  title      = {Learning to Speak from Text: Zero-Shot Multilingual
                Text-to-Speech with Unsupervised Text Pretraining},
  year       = {2023},
  journal    = {CoRR},
  volume     = {abs/2301.12596},
  doi        = {10.48550/ARXIV.2301.12596},
  url        = {https://doi.org/10.48550/arXiv.2301.12596},
  eprinttype = {arXiv},
  eprint     = {2301.12596},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-12596.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2302.13652 (CoRR record).
% Same author list and (case aside) same title as DBLP:conf/icassp/YangKSSXS23 -- presumably the published version; TODO confirm.
@article{DBLP:journals/corr/abs-2302-13652,
  author     = {Yang, Dong and
                Koriyama, Tomoki and
                Saito, Yuki and
                Saeki, Takaaki and
                Xin, Detai and
                Saruwatari, Hiroshi},
  title      = {Duration-aware pause insertion using pre-trained language model
                for multi-speaker text-to-speech},
  year       = {2023},
  journal    = {CoRR},
  volume     = {abs/2302.13652},
  doi        = {10.48550/ARXIV.2302.13652},
  url        = {https://doi.org/10.48550/arXiv.2302.13652},
  eprinttype = {arXiv},
  eprint     = {2302.13652},
  timestamp  = {Tue, 28 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-13652.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2303.03869 (CoRR record).
% Same author list and (case aside) same title as DBLP:conf/icassp/RibeiroKS23 -- presumably the published version; TODO confirm.
@article{DBLP:journals/corr/abs-2303-03869,
  author     = {Ribeiro, Juliano G. C. and
                Koyama, Shoichi and
                Saruwatari, Hiroshi},
  title      = {Kernel interpolation of acoustic transfer functions
                with adaptive kernel for directed and residual reverberations},
  year       = {2023},
  journal    = {CoRR},
  volume     = {abs/2303.03869},
  doi        = {10.48550/ARXIV.2303.03869},
  url        = {https://doi.org/10.48550/arXiv.2303.03869},
  eprinttype = {arXiv},
  eprint     = {2303.03869},
  timestamp  = {Thu, 16 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-03869.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2303.16021 (CoRR record).
% Same author list and (case aside) same title as DBLP:conf/icassp/ArikawaKS23 -- presumably the published version; TODO confirm.
@article{DBLP:journals/corr/abs-2303-16021,
  author     = {Arikawa, Kazuyuki and
                Koyama, Shoichi and
                Saruwatari, Hiroshi},
  title      = {Spatial Active Noise Control Method Based On Sound Field
                Interpolation From Reference Microphone Signals},
  year       = {2023},
  journal    = {CoRR},
  volume     = {abs/2303.16021},
  doi        = {10.48550/ARXIV.2303.16021},
  url        = {https://doi.org/10.48550/arXiv.2303.16021},
  eprinttype = {arXiv},
  eprint     = {2303.16021},
  timestamp  = {Thu, 13 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-16021.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2305.12442, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2305-12442,
  author     = {Xin, Detai and
                Takamichi, Shinnosuke and
                Morimatsu, Ai and
                Saruwatari, Hiroshi},
  title      = {Laughter Synthesis using Pseudo Phonetic Tokens
                with a Large-scale In-the-wild Laughter Corpus},
  year       = {2023},
  journal    = {CoRR},
  volume     = {abs/2305.12442},
  doi        = {10.48550/ARXIV.2305.12442},
  url        = {https://doi.org/10.48550/arXiv.2305.12442},
  eprinttype = {arXiv},
  eprint     = {2305.12442},
  timestamp  = {Fri, 26 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-12442.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2305.12445 (CoRR record). "Japanese" is braced so sentence-casing styles keep its capital.
% Same author list and (case aside) same title as DBLP:journals/speech/XinTS24 -- presumably the published version; TODO confirm.
@article{DBLP:journals/corr/abs-2305-12445,
  author     = {Xin, Detai and
                Takamichi, Shinnosuke and
                Saruwatari, Hiroshi},
  title      = {{JNV} Corpus: {A} Corpus of {Japanese} Nonverbal Vocalizations with
                Diverse Phrases and Emotions},
  year       = {2023},
  journal    = {CoRR},
  volume     = {abs/2305.12445},
  doi        = {10.48550/ARXIV.2305.12445},
  url        = {https://doi.org/10.48550/arXiv.2305.12445},
  eprinttype = {arXiv},
  eprint     = {2305.12445},
  timestamp  = {Fri, 26 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-12445.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2305.13713 (CoRR record) on the CALLS corpus. "Japanese" is braced so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-2305-13713,
  author     = {Saito, Yuki and
                Iimori, Eiji and
                Takamichi, Shinnosuke and
                Tachibana, Kentaro and
                Saruwatari, Hiroshi},
  title      = {{CALLS:} {Japanese} Empathetic Dialogue Speech Corpus of Complaint Handling
                and Attentive Listening in Customer Center},
  year       = {2023},
  journal    = {CoRR},
  volume     = {abs/2305.13713},
  doi        = {10.48550/ARXIV.2305.13713},
  url        = {https://doi.org/10.48550/arXiv.2305.13713},
  eprinttype = {arXiv},
  eprint     = {2305.13713},
  timestamp  = {Mon, 05 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-13713.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2305.13724 (CoRR record). "ChatGPT-EDSS" and "ChatGPT" are braced so sentence-casing styles
% keep their capitals; the colon stays outside the braces so the word after it keeps its capital.
@article{DBLP:journals/corr/abs-2305-13724,
  author     = {Saito, Yuki and
                Takamichi, Shinnosuke and
                Iimori, Eiji and
                Tachibana, Kentaro and
                Saruwatari, Hiroshi},
  title      = {{ChatGPT-EDSS}: Empathetic Dialogue Speech Synthesis Trained from
                {ChatGPT}-derived Context Word Embeddings},
  year       = {2023},
  journal    = {CoRR},
  volume     = {abs/2305.13724},
  doi        = {10.48550/ARXIV.2305.13724},
  url        = {https://doi.org/10.48550/arXiv.2305.13724},
  eprinttype = {arXiv},
  eprint     = {2305.13724},
  timestamp  = {Mon, 05 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-13724.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2306.00697, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2306-00697,
  author     = {Park, Joonyong and
                Takamichi, Shinnosuke and
                Nakamura, Tomohiko and
                Seki, Kentaro and
                Xin, Detai and
                Saruwatari, Hiroshi},
  title      = {How Generative Spoken Language Modeling Encodes Noisy Speech:
                Investigation from Phonetics to Syntactics},
  year       = {2023},
  journal    = {CoRR},
  volume     = {abs/2306.00697},
  doi        = {10.48550/ARXIV.2306.00697},
  url        = {https://doi.org/10.48550/arXiv.2306.00697},
  eprinttype = {arXiv},
  eprint     = {2306.00697},
  timestamp  = {Mon, 12 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-00697.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2306.08855 (CoRR record). "Riemannian" is braced so sentence-casing styles keep its capital.
% Same title and author list as DBLP:conf/eusipco/KojimaAKS23 -- presumably the published version; TODO confirm.
@article{DBLP:journals/corr/abs-2306-08855,
  author     = {Kojima, Takaaki and
                Arikawa, Kazuyuki and
                Koyama, Shoichi and
                Saruwatari, Hiroshi},
  title      = {Multichannel Active Noise Control with Exterior Radiation Suppression
                Based on {Riemannian} Optimization},
  year       = {2023},
  journal    = {CoRR},
  volume     = {abs/2306.08855},
  doi        = {10.48550/ARXIV.2306.08855},
  url        = {https://doi.org/10.48550/arXiv.2306.08855},
  eprinttype = {arXiv},
  eprint     = {2306.08855},
  timestamp  = {Mon, 19 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-08855.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2306.10718 (CoRR record).
% Same title and author list as DBLP:conf/eusipco/ImamuraNTYS23 -- presumably the published version; TODO confirm.
@article{DBLP:journals/corr/abs-2306-10718,
  author     = {Imamura, Kanami and
                Nakamura, Tomohiko and
                Takamune, Norihiro and
                Yatabe, Kohei and
                Saruwatari, Hiroshi},
  title      = {Algorithms of Sampling-Frequency-Independent Layers
                for Non-integer Strides},
  year       = {2023},
  journal    = {CoRR},
  volume     = {abs/2306.10718},
  doi        = {10.48550/ARXIV.2306.10718},
  url        = {https://doi.org/10.48550/arXiv.2306.10718},
  eprinttype = {arXiv},
  eprint     = {2306.10718},
  timestamp  = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-10718.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2306.12169 (CoRR record). The coined name "HumanDiffusion" is braced so sentence-casing styles
% keep its inner capital.
@article{DBLP:journals/corr/abs-2306-12169,
  author     = {Ueda, Yota and
                Takamichi, Shinnosuke and
                Saito, Yuki and
                Takamune, Norihiro and
                Saruwatari, Hiroshi},
  title      = {{HumanDiffusion}: diffusion model using perceptual gradients},
  year       = {2023},
  journal    = {CoRR},
  volume     = {abs/2306.12169},
  doi        = {10.48550/ARXIV.2306.12169},
  url        = {https://doi.org/10.48550/arXiv.2306.12169},
  eprinttype = {arXiv},
  eprint     = {2306.12169},
  timestamp  = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-12169.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-12820,
  author       = {Nishida, Koki and
                  Takamune, Norihiro and
                  Ikeshita, Rintaro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Nakatani, Tomohiro},
  title        = {{NoisyILRMA}: Diffuse-Noise-Aware Independent Low-Rank Matrix Analysis
                  for Fast Blind Source Extraction},
  journal      = {CoRR},
  volume       = {abs/2306.12820},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.12820},
  doi          = {10.48550/ARXIV.2306.12820},
  eprinttype   = {arXiv},
  eprint       = {2306.12820},
  timestamp    = {Tue, 27 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-12820.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2307-13941,
  author       = {Kimura, Keisuke and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Perceptual Quality Enhancement of Sound Field Synthesis Based on Combination
                  of Pressure and Amplitude Matching},
  journal      = {CoRR},
  volume       = {abs/2307.13941},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.13941},
  doi          = {10.48550/ARXIV.2307.13941},
  eprinttype   = {arXiv},
  eprint       = {2307.13941},
  timestamp    = {Tue, 01 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-13941.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2309-05634,
  author       = {Koyama, Shoichi and
                  Nakada, Masaki and
                  Ribeiro, Juliano G. C. and
                  Saruwatari, Hiroshi},
  title        = {Kernel Interpolation of Incident Sound Field in Region Including Scattering
                  Objects},
  journal      = {CoRR},
  volume       = {abs/2309.05634},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.05634},
  doi          = {10.48550/ARXIV.2309.05634},
  eprinttype   = {arXiv},
  eprint       = {2309.05634},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-05634.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2309-08127,
  author       = {Seki, Kentaro and
                  Takamichi, Shinnosuke and
                  Saeki, Takaaki and
                  Saruwatari, Hiroshi},
  title        = {Diversity-based core-set selection for text-to-speech with linguistic
                  and acoustic features},
  journal      = {CoRR},
  volume       = {abs/2309.08127},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.08127},
  doi          = {10.48550/ARXIV.2309.08127},
  eprinttype   = {arXiv},
  eprint       = {2309.08127},
  timestamp    = {Fri, 22 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-08127.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2309-09690,
  author       = {Takamichi, Shinnosuke and
                  Maeda, Hiroki and
                  Park, Joonyong and
                  Saito, Daisuke and
                  Saruwatari, Hiroshi},
  title        = {Do learned speech symbols follow {Zipf's} law?},
  journal      = {CoRR},
  volume       = {abs/2309.09690},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.09690},
  doi          = {10.48550/ARXIV.2309.09690},
  eprinttype   = {arXiv},
  eprint       = {2309.09690},
  timestamp    = {Fri, 22 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-09690.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2309-13509,
  author       = {Watanabe, Aya and
                  Takamichi, Shinnosuke and
                  Saito, Yuki and
                  Nakata, Wataru and
                  Xin, Detai and
                  Saruwatari, Hiroshi},
  title        = {{Coco-Nut}: Corpus of {Japanese} Utterance and Voice Characteristics
                  Description for Prompt-based Control},
  journal      = {CoRR},
  volume       = {abs/2309.13509},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.13509},
  doi          = {10.48550/ARXIV.2309.13509},
  eprinttype   = {arXiv},
  eprint       = {2309.13509},
  timestamp    = {Wed, 27 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-13509.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2310-06072,
  author       = {Xin, Detai and
                  Jiang, Junfeng and
                  Takamichi, Shinnosuke and
                  Saito, Yuki and
                  Aizawa, Akiko and
                  Saruwatari, Hiroshi},
  title        = {{JVNV:} {A} Corpus of {Japanese} Emotional Speech with Verbal Content
                  and Nonverbal Expressions},
  journal      = {CoRR},
  volume       = {abs/2310.06072},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.06072},
  doi          = {10.48550/ARXIV.2310.06072},
  eprinttype   = {arXiv},
  eprint       = {2310.06072},
  timestamp    = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-06072.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ejasp/KondoKTKS22,
  author       = {Kondo, Yuto and
                  Kubo, Yuki and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi},
  title        = {Deficient-basis-complementary rank-constrained spatial covariance
                  matrix estimation based on multivariate generalized {Gaussian} distribution
                  for blind speech extraction},
  journal      = {{EURASIP} J. Adv. Signal Process.},
  volume       = {2022},
  number       = {1},
  pages        = {88},
  year         = {2022},
  url          = {https://doi.org/10.1186/s13634-022-00905-z},
  doi          = {10.1186/S13634-022-00905-Z},
  timestamp    = {Mon, 05 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ejasp/KondoKTKS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/taslp/SaitoNYS22,
  author       = {Saito, Koichi and
                  Nakamura, Tomohiko and
                  Yatabe, Kohei and
                  Saruwatari, Hiroshi},
  title        = {Sampling-Frequency-Independent Convolutional Layer and its Application
                  to Audio Source Separation},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {30},
  pages        = {2928--2943},
  year         = {2022},
  url          = {https://doi.org/10.1109/TASLP.2022.3203907},
  doi          = {10.1109/TASLP.2022.3203907},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/SaitoNYS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/taslp/RibeiroUKS22,
  author       = {Ribeiro, Juliano G. C. and
                  Ueno, Natsuki and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Region-to-Region Kernel Interpolation of Acoustic Transfer Functions
                  Constrained by Physical Properties},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {30},
  pages        = {2944--2954},
  year         = {2022},
  url          = {https://doi.org/10.1109/TASLP.2022.3201368},
  doi          = {10.1109/TASLP.2022.3201368},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/RibeiroUKS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/tsp/NishidaUKS22,
  author       = {Nishida, Tomoya and
                  Ueno, Natsuki and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Region-Restricted Sensor Placement Based on {Gaussian} Process for Sound
                  Field Estimation},
  journal      = {{IEEE} Trans. Signal Process.},
  volume       = {70},
  pages        = {1718--1733},
  year         = {2022},
  url          = {https://doi.org/10.1109/TSP.2022.3156012},
  doi          = {10.1109/TSP.2022.3156012},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tsp/NishidaUKS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/RibeiroKS22,
  author       = {Ribeiro, Juliano G. C. and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Region-to-Region Kernel Interpolation of Acoustic Transfer Function
                  with Directional Weighting},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages        = {576--580},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/ICASSP43922.2022.9746842},
  doi          = {10.1109/ICASSP43922.2022.9746842},
  timestamp    = {Tue, 07 Jun 2022 17:34:47 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/RibeiroKS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/KawamuraNKSTK22,
  author       = {Kawamura, Masaya and
                  Nakamura, Tomohiko and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {Differentiable Digital Signal Processing Mixture Model for Synthesis
                  Parameter Extraction from Mixture of Harmonic Sounds},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages        = {941--945},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/ICASSP43922.2022.9746399},
  doi          = {10.1109/ICASSP43922.2022.9746399},
  timestamp    = {Thu, 23 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/KawamuraNKSTK22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/ArikawaKS22,
  author       = {Arikawa, Kazuyuki and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Spatial Active Noise Control Based on Individual Kernel Interpolation
                  of Primary and Secondary Sound Fields},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages        = {1056--1060},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/ICASSP43922.2022.9746065},
  doi          = {10.1109/ICASSP43922.2022.9746065},
  timestamp    = {Tue, 07 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ArikawaKS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/TakamichiNTS22,
  author       = {Takamichi, Shinnosuke and
                  Nakata, Wataru and
                  Tanji, Naoko and
                  Saruwatari, Hiroshi},
  editor       = {Ko, Hanseok and
                  Hansen, John H. L.},
  title        = {{J-MAC:} {Japanese} multi-speaker audiobook corpus for speech synthesis},
  booktitle    = {Interspeech 2022, 23rd Annual Conference of the International Speech
                  Communication Association, Incheon, Korea, 18-22 September 2022},
  pages        = {2358--2362},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-444},
  doi          = {10.21437/INTERSPEECH.2022-444},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/TakamichiNTS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/UdagawaSS22,
  author       = {Udagawa, Kenta and
                  Saito, Yuki and
                  Saruwatari, Hiroshi},
  editor       = {Ko, Hanseok and
                  Hansen, John H. L.},
  title        = {Human-in-the-loop Speaker Adaptation for {DNN}-based Multi-speaker {TTS}},
  booktitle    = {Interspeech 2022, 23rd Annual Conference of the International Speech
                  Communication Association, Incheon, Korea, 18-22 September 2022},
  pages        = {2968--2972},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-257},
  doi          = {10.21437/INTERSPEECH.2022-257},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/UdagawaSS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/NishimuraSTTS22,
  author       = {Nishimura, Yuto and
                  Saito, Yuki and
                  Takamichi, Shinnosuke and
                  Tachibana, Kentaro and
                  Saruwatari, Hiroshi},
  editor       = {Ko, Hanseok and
                  Hansen, John H. L.},
  title        = {Acoustic Modeling for End-to-End Empathetic Dialogue Speech Synthesis
                  Using Linguistic and Prosodic Contexts of Dialogue History},
  booktitle    = {Interspeech 2022, 23rd Annual Conference of the International Speech
                  Communication Association, Incheon, Korea, 18-22 September 2022},
  pages        = {3373--3377},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-403},
  doi          = {10.21437/INTERSPEECH.2022-403},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/NishimuraSTTS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/SaekiTNTS22,
  author       = {Saeki, Takaaki and
                  Takamichi, Shinnosuke and
                  Nakamura, Tomohiko and
                  Tanji, Naoko and
                  Saruwatari, Hiroshi},
  editor       = {Ko, Hanseok and
                  Hansen, John H. L.},
  title        = {{SelfRemaster}: Self-Supervised Speech Restoration with Analysis-by-Synthesis
                  Approach Using Channel Modeling},
  booktitle    = {Interspeech 2022, 23rd Annual Conference of the International Speech
                  Communication Association, Incheon, Korea, 18-22 September 2022},
  pages        = {4406--4410},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-298},
  doi          = {10.21437/INTERSPEECH.2022-298},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SaekiTNTS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/SaekiXNKTS22,
  author       = {Saeki, Takaaki and
                  Xin, Detai and
                  Nakata, Wataru and
                  Koriyama, Tomoki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  editor       = {Ko, Hanseok and
                  Hansen, John H. L.},
  title        = {{UTMOS:} {UTokyo-SaruLab} System for {VoiceMOS} {Challenge} 2022},
  booktitle    = {Interspeech 2022, 23rd Annual Conference of the International Speech
                  Communication Association, Incheon, Korea, 18-22 September 2022},
  pages        = {4521--4525},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-439},
  doi          = {10.21437/INTERSPEECH.2022-439},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SaekiXNKTS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/NakataKTSIMS22,
  author       = {Nakata, Wataru and
                  Koriyama, Tomoki and
                  Takamichi, Shinnosuke and
                  Saito, Yuki and
                  Ijima, Yusuke and
                  Masumura, Ryo and
                  Saruwatari, Hiroshi},
  editor       = {Ko, Hanseok and
                  Hansen, John H. L.},
  title        = {Predicting {VQVAE}-based Character Acting Style from Quotation-Annotated
                  Text for Audiobook Speech Synthesis},
  booktitle    = {Interspeech 2022, 23rd Annual Conference of the International Speech
                  Communication Association, Incheon, Korea, 18-22 September 2022},
  pages        = {4551--4555},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-638},
  doi          = {10.21437/INTERSPEECH.2022-638},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/NakataKTSIMS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/SaitoNTTS22,
  author       = {Saito, Yuki and
                  Nishimura, Yuto and
                  Takamichi, Shinnosuke and
                  Tachibana, Kentaro and
                  Saruwatari, Hiroshi},
  editor       = {Ko, Hanseok and
                  Hansen, John H. L.},
  title        = {{STUDIES:} Corpus of {Japanese} Empathetic Dialogue Speech Towards Friendly
                  Voice Agent},
  booktitle    = {Interspeech 2022, 23rd Annual Conference of the International Speech
                  Communication Association, Incheon, Korea, 18-22 September 2022},
  pages        = {5155--5159},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-300},
  doi          = {10.21437/INTERSPEECH.2022-300},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SaitoNTTS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iwaenc/ItoNKS22,
  author       = {Ito, Yuki and
                  Nakamura, Tomohiko and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Head-Related Transfer Function Interpolation From Spatially Sparse
                  Measurements Using Autoencoder With Source Position Conditioning},
  booktitle    = {17th International Workshop on Acoustic Signal Enhancement, {IWAENC}
                  2022, Bamberg, Germany, September 5-8, 2022},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/IWAENC53105.2022.9914751},
  doi          = {10.1109/IWAENC53105.2022.9914751},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iwaenc/ItoNKS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iwaenc/ShigemiKNS22,
  author       = {Shigemi, Kazuhide and
                  Koyama, Shoichi and
                  Nakamura, Tomohiko and
                  Saruwatari, Hiroshi},
  title        = {Physics-Informed Convolutional Neural Network with Bicubic Spline
                  Interpolation for Sound Field Estimation},
  booktitle    = {17th International Workshop on Acoustic Signal Enhancement, {IWAENC}
                  2022, Bamberg, Germany, September 5-8, 2022},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/IWAENC53105.2022.9914792},
  doi          = {10.1109/IWAENC53105.2022.9914792},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iwaenc/ShigemiKNS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/lrec/MatsunagaSTS22,
  author       = {Matsunaga, Yuta and
                  Saeki, Takaaki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  editor       = {Calzolari, Nicoletta and
                  B{\'{e}}chet, Fr{\'{e}}d{\'{e}}ric and
                  Blache, Philippe and
                  Choukri, Khalid and
                  Cieri, Christopher and
                  Declerck, Thierry and
                  Goggi, Sara and
                  Isahara, Hitoshi and
                  Maegaard, Bente and
                  Mariani, Joseph and
                  Mazo, H{\'{e}}l{\`{e}}ne and
                  Odijk, Jan and
                  Piperidis, Stelios},
  title        = {Personalized Filled-pause Generation with Group-wise Prediction Models},
  booktitle    = {Proceedings of the Thirteenth Language Resources and Evaluation Conference,
                  {LREC} 2022, Marseille, France, 20-25 June 2022},
  pages        = {385--392},
  publisher    = {European Language Resources Association},
  year         = {2022},
  url          = {https://aclanthology.org/2022.lrec-1.40},
  timestamp    = {Mon, 10 Oct 2022 16:57:52 +0200},
  biburl       = {https://dblp.org/rec/conf/lrec/MatsunagaSTS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/slt/NakanoSTSS22,
  author       = {Nakano, Yoshifumi and
                  Saeki, Takaaki and
                  Takamichi, Shinnosuke and
                  Sudoh, Katsuhito and
                  Saruwatari, Hiroshi},
  title        = {{VTTS:} Visual-Text To Speech},
  booktitle    = {{IEEE} Spoken Language Technology Workshop, {SLT} 2022, Doha, Qatar,
                  January 9-12, 2023},
  pages        = {936--942},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/SLT54892.2023.10022739},
  doi          = {10.1109/SLT54892.2023.10022739},
  timestamp    = {Mon, 06 Feb 2023 22:19:30 +0100},
  biburl       = {https://dblp.org/rec/conf/slt/NakanoSTSS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2201-10896,
  author       = {Takamichi, Shinnosuke and
                  Nakata, Wataru and
                  Tanji, Naoko and
                  Saruwatari, Hiroshi},
  title        = {{J-MAC:} {Japanese} multi-speaker audiobook corpus for speech synthesis},
  journal      = {CoRR},
  volume       = {abs/2201.10896},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.10896},
  eprinttype   = {arXiv},
  eprint       = {2201.10896},
  timestamp    = {Tue, 01 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-10896.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2202-00200,
  author       = {Kawamura, Masaya and
                  Nakamura, Tomohiko and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {Differentiable Digital Signal Processing Mixture Model for Synthesis
                  Parameter Extraction from Mixture of Harmonic Sounds},
  journal      = {CoRR},
  volume       = {abs/2202.00200},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.00200},
  eprinttype   = {arXiv},
  eprint       = {2202.00200},
  timestamp    = {Wed, 09 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-00200.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2202-04807,
  author       = {Arikawa, Kazuyuki and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Spatial active noise control based on individual kernel interpolation
                  of primary and secondary sound fields},
  journal      = {CoRR},
  volume       = {abs/2202.04807},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.04807},
  eprinttype   = {arXiv},
  eprint       = {2202.04807},
  timestamp    = {Tue, 01 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-04807.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2203-09961,
  author       = {Matsunaga, Yuta and
                  Saeki, Takaaki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Personalized filled-pause generation with group-wise prediction models},
  journal      = {CoRR},
  volume       = {abs/2203.09961},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.09961},
  doi          = {10.48550/ARXIV.2203.09961},
  eprinttype   = {arXiv},
  eprint       = {2203.09961},
  timestamp    = {Mon, 28 Mar 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-09961.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2203-12937,
  author       = {Saeki, Takaaki and
                  Takamichi, Shinnosuke and
                  Nakamura, Tomohiko and
                  Tanji, Naoko and
                  Saruwatari, Hiroshi},
  title        = {{SelfRemaster}: Self-Supervised Speech Restoration with Analysis-by-Synthesis
                  Approach Using Channel Modeling},
  journal      = {CoRR},
  volume       = {abs/2203.12937},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.12937},
  doi          = {10.48550/ARXIV.2203.12937},
  eprinttype   = {arXiv},
  eprint       = {2203.12937},
  timestamp    = {Tue, 29 Mar 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-12937.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2203-14725,
  author       = {Nakano, Yoshifumi and
                  Saeki, Takaaki and
                  Takamichi, Shinnosuke and
                  Sudoh, Katsuhito and
                  Saruwatari, Hiroshi},
  title        = {{vTTS}: visual-text to speech},
  journal      = {CoRR},
  volume       = {abs/2203.14725},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.14725},
  doi          = {10.48550/ARXIV.2203.14725},
  eprinttype   = {arXiv},
  eprint       = {2203.14725},
  timestamp    = {Mon, 04 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-14725.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2203-14757,
  author       = {Saito, Yuki and
                  Nishimura, Yuto and
                  Takamichi, Shinnosuke and
                  Tachibana, Kentaro and
                  Saruwatari, Hiroshi},
  title        = {{STUDIES:} Corpus of {Japanese} Empathetic Dialogue Speech Towards Friendly
                  Voice Agent},
  journal      = {CoRR},
  volume       = {abs/2203.14757},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.14757},
  doi          = {10.48550/ARXIV.2203.14757},
  eprinttype   = {arXiv},
  eprint       = {2203.14757},
  timestamp    = {Mon, 04 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-14757.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2204-02152,
  author       = {Saeki, Takaaki and
                  Xin, Detai and
                  Nakata, Wataru and
                  Koriyama, Tomoki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {{UTMOS:} {UTokyo-SaruLab} System for {VoiceMOS} {Challenge} 2022},
  journal      = {CoRR},
  volume       = {abs/2204.02152},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2204.02152},
  doi          = {10.48550/ARXIV.2204.02152},
  eprinttype   = {arXiv},
  eprint       = {2204.02152},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2204-02152.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2204-10561,
  author       = {Xin, Detai and
                  Takamichi, Shinnosuke and
                  Okamoto, Takuma and
                  Kawai, Hisashi and
                  Saruwatari, Hiroshi},
  title        = {Speaking-Rate-Controllable {HiFi-GAN} Using Feature Interpolation},
  journal      = {CoRR},
  volume       = {abs/2204.10561},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2204.10561},
  doi          = {10.48550/ARXIV.2204.10561},
  eprinttype   = {arXiv},
  eprint       = {2204.10561},
  timestamp    = {Mon, 25 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2204-10561.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-08039,
  author       = {Nishimura, Yuto and
                  Saito, Yuki and
                  Takamichi, Shinnosuke and
                  Tachibana, Kentaro and
                  Saruwatari, Hiroshi},
  title        = {Acoustic Modeling for End-to-End Empathetic Dialogue Speech Synthesis
                  Using Linguistic and Prosodic Contexts of Dialogue History},
  journal      = {CoRR},
  volume       = {abs/2206.08039},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.08039},
  doi          = {10.48550/ARXIV.2206.08039},
  eprinttype   = {arXiv},
  eprint       = {2206.08039},
  timestamp    = {Tue, 21 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-08039.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-10256,
  author       = {Udagawa, Kenta and
                  Saito, Yuki and
                  Saruwatari, Hiroshi},
  title        = {Human-in-the-loop Speaker Adaptation for {DNN}-based Multi-speaker {TTS}},
  journal      = {CoRR},
  volume       = {abs/2206.10256},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.10256},
  doi          = {10.48550/ARXIV.2206.10256},
  eprinttype   = {arXiv},
  eprint       = {2206.10256},
  timestamp    = {Mon, 27 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-10256.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-10695,
  author       = {Xin, Detai and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Exploring the Effectiveness of Self-supervised Learning and Classifier
                  Chains in Emotion Recognition of Nonverbal Vocalizations},
  journal      = {CoRR},
  volume       = {abs/2206.10695},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.10695},
  doi          = {10.48550/ARXIV.2206.10695},
  eprinttype   = {arXiv},
  eprint       = {2206.10695},
  timestamp    = {Mon, 27 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-10695.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2207-10937,
  author       = {Shigemi, Kazuhide and
                  Koyama, Shoichi and
                  Nakamura, Tomohiko and
                  Saruwatari, Hiroshi},
  title        = {Physics-informed convolutional neural network with bicubic spline interpolation for sound field estimation},
  journal      = {CoRR},
  volume       = {abs/2207.10937},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.10937},
  doi          = {10.48550/ARXIV.2207.10937},
  eprinttype   = {arXiv},
  eprint       = {2207.10937},
  timestamp    = {Mon, 25 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-10937.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2207-10967,
  author       = {Ito, Yuki and
                  Nakamura, Tomohiko and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Head-Related Transfer Function Interpolation from Spatially Sparse Measurements Using Autoencoder with Source Position Conditioning},
  journal      = {CoRR},
  volume       = {abs/2207.10967},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.10967},
  doi          = {10.48550/ARXIV.2207.10967},
  eprinttype   = {arXiv},
  eprint       = {2207.10967},
  timestamp    = {Mon, 25 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-10967.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2209-12549,
  author       = {Nakai, Yusuke and
                  Saito, Yuki and
                  Udagawa, Kenta and
                  Saruwatari, Hiroshi},
  title        = {Multi-Task Adversarial Training Algorithm for Multi-Speaker Neural Text-to-Speech},
  journal      = {CoRR},
  volume       = {abs/2209.12549},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2209.12549},
  doi          = {10.48550/ARXIV.2209.12549},
  eprinttype   = {arXiv},
  eprint       = {2209.12549},
  timestamp    = {Thu, 06 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2209-12549.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2210-07559,
  author       = {Matsunaga, Yuta and
                  Saeki, Takaaki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Empirical Study Incorporating Linguistic Knowledge on Filled Pauses for Personalized Spontaneous Speech Synthesis},
  journal      = {CoRR},
  volume       = {abs/2210.07559},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.07559},
  doi          = {10.48550/ARXIV.2210.07559},
  eprinttype   = {arXiv},
  eprint       = {2210.07559},
  timestamp    = {Tue, 18 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-07559.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2210-09173,
  author       = {Ohnaka, Hien and
                  Takamichi, Shinnosuke and
                  Imoto, Keisuke and
                  Okamoto, Yuki and
                  Fujii, Kazuki and
                  Saruwatari, Hiroshi},
  title        = {Visual onoma-to-wave: environmental sound synthesis from visual onomatopoeias and sound-source images},
  journal      = {CoRR},
  volume       = {abs/2210.09173},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.09173},
  doi          = {10.48550/ARXIV.2210.09173},
  eprinttype   = {arXiv},
  eprint       = {2210.09173},
  timestamp    = {Wed, 19 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-09173.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2210-09815,
  author       = {Matsunaga, Yuta and
                  Saeki, Takaaki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Spontaneous speech synthesis with linguistic-speech consistency training using pseudo-filled pauses},
  journal      = {CoRR},
  volume       = {abs/2210.09815},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.09815},
  doi          = {10.48550/ARXIV.2210.09815},
  eprinttype   = {arXiv},
  eprint       = {2210.09815},
  timestamp    = {Mon, 24 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-09815.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2210-09916,
  author       = {Aya Watanabe and
                  Shinnosuke Takamichi and
                  Yuki Saito and
                  Detai Xin and
                  Hiroshi Saruwatari},
  title        = {Mid-attribute speaker generation using optimal-transport-based interpolation
                  of {Gaussian} mixture models},
  journal      = {CoRR},
  volume       = {abs/2210.09916},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.09916},
  doi          = {10.48550/ARXIV.2210.09916},
  eprinttype   = {arXiv},
  eprint       = {2210.09916},
  timestamp    = {Mon, 24 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-09916.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2210-14850,
  author       = {Seki, Kentaro and
                  Takamichi, Shinnosuke and
                  Saeki, Takaaki and
                  Saruwatari, Hiroshi},
  title        = {Text-to-speech synthesis from dark data with evaluation-in-the-loop data selection},
  journal      = {CoRR},
  volume       = {abs/2210.14850},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.14850},
  doi          = {10.48550/ARXIV.2210.14850},
  eprinttype   = {arXiv},
  eprint       = {2210.14850},
  timestamp    = {Wed, 02 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-14850.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2211-02336,
  author       = {Xin, Detai and
                  Adavanne, Sharath and
                  Ang, Federico and
                  Kulkarni, Ashish and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Improving Speech Prosody of Audiobook Text-to-Speech Synthesis with Acoustic and Textual Contexts},
  journal      = {CoRR},
  volume       = {abs/2211.02336},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.02336},
  doi          = {10.48550/ARXIV.2211.02336},
  eprinttype   = {arXiv},
  eprint       = {2211.02336},
  timestamp    = {Wed, 09 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-02336.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2211-16028,
  author       = {Tomohiko Nakamura and
                  Shinnosuke Takamichi and
                  Naoko Tanji and
                  Satoru Fukayama and
                  Hiroshi Saruwatari},
  title        = {{jaCappella} Corpus: {A} {Japanese} a Cappella Vocal Ensemble Corpus},
  journal      = {CoRR},
  volume       = {abs/2211.16028},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.16028},
  doi          = {10.48550/ARXIV.2211.16028},
  eprinttype   = {arXiv},
  eprint       = {2211.16028},
  timestamp    = {Fri, 02 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-16028.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieiceta/UenoKS21,
  author       = {Natsuki Ueno and
                  Shoichi Koyama and
                  Hiroshi Saruwatari},
  title        = {Convex and Differentiable Formulation for Inverse Problems in {Hilbert}
                  Spaces with Nonlinear Clipping Effects},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {104-A},
  number       = {9},
  pages        = {1293--1303},
  year         = {2021},
  url          = {https://doi.org/10.1587/transfun.2021eap1004},
  doi          = {10.1587/TRANSFUN.2021EAP1004},
  timestamp    = {Thu, 12 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieiceta/UenoKS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicetd/AibaYKTS21,
  author       = {Akihito Aiba and
                  Minoru Yoshida and
                  Daichi Kitamura and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  title        = {Noise Robust Acoustic Anomaly Detection System with Nonnegative Matrix
                  Factorization Based on Generalized {Gaussian} Distribution},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {104-D},
  number       = {3},
  pages        = {441--449},
  year         = {2021},
  url          = {http://search.ieice.org/bin/summary.php?id=e104-d\_3\_441},
  timestamp    = {Mon, 17 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicetd/AibaYKTS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicetd/SaekiSTS21,
  author       = {Saeki, Takaaki and
                  Saito, Yuki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Real-Time Full-Band Voice Conversion with Sub-Band Modeling and Data-Driven Phase Estimation of Spectral Differentials},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {104-D},
  number       = {7},
  pages        = {1002--1016},
  year         = {2021},
  url          = {https://doi.org/10.1587/transinf.2020edp7252},
  doi          = {10.1587/TRANSINF.2020EDP7252},
  timestamp    = {Thu, 12 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicetd/SaekiSTS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicetd/MizoguchiSTS21,
  author       = {Satoshi Mizoguchi and
                  Yuki Saito and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  title        = {{DNN}-Based Low-Musical-Noise Single-Channel Speech Enhancement Based
                  on Higher-Order-Moments Matching},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {104-D},
  number       = {11},
  pages        = {1971--1980},
  year         = {2021},
  url          = {https://doi.org/10.1587/transinf.2021edp7041},
  doi          = {10.1587/TRANSINF.2021EDP7041},
  timestamp    = {Thu, 12 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicetd/MizoguchiSTS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/sigpro/MakishimaMTKSTK21,
  author       = {Makishima, Naoki and
                  Mitsui, Yoshiki and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {Independent deeply learned matrix analysis with automatic selection of stable microphone-wise update and fast sourcewise update of demixing matrix},
  journal      = {Signal Process.},
  volume       = {178},
  pages        = {107753},
  year         = {2021},
  url          = {https://doi.org/10.1016/j.sigpro.2020.107753},
  doi          = {10.1016/J.SIGPRO.2020.107753},
  timestamp    = {Fri, 14 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/sigpro/MakishimaMTKSTK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/sigpro/KamoMKTKSTK21,
  author       = {Keigo Kamo and
                  Yoshiki Mitsui and
                  Yuki Kubo and
                  Norihiro Takamune and
                  Daichi Kitamura and
                  Hiroshi Saruwatari and
                  Yu Takahashi and
                  Kazunobu Kondo},
  title        = {Joint-diagonalizability-constrained multichannel nonnegative matrix
                  factorization based on time-variant multivariate complex sub-{Gaussian}
                  distribution},
  journal      = {Signal Process.},
  volume       = {188},
  pages        = {108183},
  year         = {2021},
  url          = {https://doi.org/10.1016/j.sigpro.2021.108183},
  doi          = {10.1016/J.SIGPRO.2021.108183},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/sigpro/KamoMKTKSTK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/speech/MitsuiKS21,
  author       = {Kentaro Mitsui and
                  Tomoki Koriyama and
                  Hiroshi Saruwatari},
  title        = {Deep {Gaussian} process based multi-speaker speech synthesis with latent
                  speaker representation},
  journal      = {Speech Commun.},
  volume       = {132},
  pages        = {132--145},
  year         = {2021},
  url          = {https://doi.org/10.1016/j.specom.2021.07.001},
  doi          = {10.1016/J.SPECOM.2021.07.001},
  timestamp    = {Fri, 13 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/speech/MitsuiKS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/spl/SaekiTS21,
  author       = {Saeki, Takaaki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Incremental Text-to-Speech Synthesis Using Pseudo Lookahead With Large Pretrained Language Model},
  journal      = {{IEEE} Signal Process. Lett.},
  volume       = {28},
  pages        = {857--861},
  year         = {2021},
  url          = {https://doi.org/10.1109/LSP.2021.3073869},
  doi          = {10.1109/LSP.2021.3073869},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/spl/SaekiTS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/MitsufujiTKS21,
  author       = {Mitsufuji, Yuki and
                  Takamune, Norihiro and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Multichannel Blind Source Separation Based on Evanescent-Region-Aware Non-Negative Tensor Factorization in Spherical Harmonic Domain},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {29},
  pages        = {607--617},
  year         = {2021},
  url          = {https://doi.org/10.1109/TASLP.2020.3045528},
  doi          = {10.1109/TASLP.2020.3045528},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/MitsufujiTKS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/SaitoTS21,
  author       = {Saito, Yuki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Perceptual-Similarity-Aware Deep Speaker Representation Learning for Multi-Speaker Generative Modeling},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {29},
  pages        = {1033--1048},
  year         = {2021},
  url          = {https://doi.org/10.1109/TASLP.2021.3059114},
  doi          = {10.1109/TASLP.2021.3059114},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/SaitoTS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/NakamuraKS21,
  author       = {Nakamura, Tomohiko and
                  Kozuka, Shihori and
                  Saruwatari, Hiroshi},
  title        = {Time-Domain Audio Source Separation With Neural Networks Based on Multiresolution Analysis},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {29},
  pages        = {1687--1701},
  year         = {2021},
  url          = {https://doi.org/10.1109/TASLP.2021.3072496},
  doi          = {10.1109/TASLP.2021.3072496},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/NakamuraKS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/KoyamaBIUS21,
  author       = {Koyama, Shoichi and
                  Brunnstr{\"{o}}m, Jesper and
                  Ito, Hayato and
                  Ueno, Natsuki and
                  Saruwatari, Hiroshi},
  title        = {Spatial Active Noise Control Based on Kernel Interpolation of Sound Field},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {29},
  pages        = {3052--3063},
  year         = {2021},
  url          = {https://doi.org/10.1109/TASLP.2021.3107983},
  doi          = {10.1109/TASLP.2021.3107983},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/KoyamaBIUS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tsp/UenoKS21,
  author       = {Ueno, Natsuki and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Directionally Weighted Wave Field Estimation Exploiting Prior Information on Source Direction},
  journal      = {{IEEE} Trans. Signal Process.},
  volume       = {69},
  pages        = {2383--2395},
  year         = {2021},
  url          = {https://doi.org/10.1109/TSP.2021.3070228},
  doi          = {10.1109/TSP.2021.3070228},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tsp/UenoKS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/MisawaTNKSUM21,
  author       = {Misawa, Sota and
                  Takamune, Norihiro and
                  Nakamura, Tomohiko and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Une, Masakazu and
                  Makino, Shoji},
  title        = {Speech Enhancement by Noise Self-Supervised Rank-Constrained Spatial Covariance Matrix Estimation via Independent Deeply Learned Matrix Analysis},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} {ASC} 2021, Tokyo, Japan, December 14-17, 2021},
  pages        = {578--584},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://ieeexplore.ieee.org/document/9689665},
  timestamp    = {Wed, 09 Feb 2022 09:03:08 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/MisawaTNKSUM21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/MizobuchiKNSTK21,
  author       = {Mizobuchi, Yusaku and
                  Kitamura, Daichi and
                  Nakamura, Tomohiko and
                  Saruwatari, Hiroshi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {Prior Distribution Design for Music Bleeding-Sound Reduction Based on Nonnegative Matrix Factorization},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} {ASC} 2021, Tokyo, Japan, December 14-17, 2021},
  pages        = {651--658},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://ieeexplore.ieee.org/document/9689601},
  timestamp    = {Wed, 09 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/MizobuchiKNSTK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/LuoTKSS21,
  author       = {Luo, Xuan and
                  Takamichi, Shinnosuke and
                  Koriyama, Tomoki and
                  Saito, Yuki and
                  Saruwatari, Hiroshi},
  title        = {Emotion-Controllable Speech Synthesis Using Emotion Soft Labels and Fine-Grained Prosody Factors},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} {ASC} 2021, Tokyo, Japan, December 14-17, 2021},
  pages        = {794--799},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://ieeexplore.ieee.org/document/9689217},
  timestamp    = {Wed, 09 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/LuoTKSS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/HasumiNTSKTK21,
  author       = {Hasumi, Takuya and
                  Nakamura, Tomohiko and
                  Takamune, Norihiro and
                  Saruwatari, Hiroshi and
                  Kitamura, Daichi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {Multichannel Audio Source Separation with Independent Deeply Learned Matrix Analysis Using Product of Source Models},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} {ASC} 2021, Tokyo, Japan, December 14-17, 2021},
  pages        = {1226--1233},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://ieeexplore.ieee.org/document/9689636},
  timestamp    = {Sun, 22 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/HasumiNTSKTK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/SaekiTS21,
  author       = {Saeki, Takaaki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Low-Latency Incremental Text-to-Speech Synthesis with Distilled Context Prediction Network},
  booktitle    = {{IEEE} Automatic Speech Recognition and Understanding Workshop, {ASRU} 2021, Cartagena, Colombia, December 13-17, 2021},
  pages        = {749--756},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ASRU51503.2021.9687904},
  doi          = {10.1109/ASRU51503.2021.9687904},
  timestamp    = {Wed, 09 Feb 2022 09:03:03 +0100},
  biburl       = {https://dblp.org/rec/conf/asru/SaekiTS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/SaitoNYKS21,
  author       = {Saito, Koichi and
                  Nakamura, Tomohiko and
                  Yatabe, Kohei and
                  Koizumi, Yuma and
                  Saruwatari, Hiroshi},
  title        = {Sampling-Frequency-Independent Audio Source Separation Using Convolution Layer Based on Impulse Invariant Method},
  booktitle    = {29th European Signal Processing Conference, {EUSIPCO} 2021, Dublin, Ireland, August 23-27, 2021},
  pages        = {321--325},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.23919/EUSIPCO54536.2021.9615941},
  doi          = {10.23919/EUSIPCO54536.2021.9615941},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eusipco/SaitoNYKS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/NarisawaITKNSN21,
  author       = {Narisawa, Naoki and
                  Ikeshita, Rintaro and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Nakamura, Tomohiko and
                  Saruwatari, Hiroshi and
                  Nakatani, Tomohiro},
  title        = {Independent Deeply Learned Tensor Analysis for Determined Audio Source Separation},
  booktitle    = {29th European Signal Processing Conference, {EUSIPCO} 2021, Dublin, Ireland, August 23-27, 2021},
  pages        = {326--330},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.23919/EUSIPCO54536.2021.9616300},
  doi          = {10.23919/EUSIPCO54536.2021.9616300},
  timestamp    = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eusipco/NarisawaITKNSN21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/HasumiNTSKTK21,
  author       = {Takuya Hasumi and
                  Tomohiko Nakamura and
                  Norihiro Takamune and
                  Hiroshi Saruwatari and
                  Daichi Kitamura and
                  Yu Takahashi and
                  Kazunobu Kondo},
  title        = {Empirical {Bayesian} Independent Deeply Learned Matrix Analysis For
                  Multichannel Audio Source Separation},
  booktitle    = {29th European Signal Processing Conference, {EUSIPCO} 2021, Dublin,
                  Ireland, August 23-27, 2021},
  pages        = {331--335},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.23919/EUSIPCO54536.2021.9616245},
  doi          = {10.23919/EUSIPCO54536.2021.9616245},
  timestamp    = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eusipco/HasumiNTSKTK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/KoyamaAUS21,
  author       = {Koyama, Shoichi and
                  Amakasu, Takashi and
                  Ueno, Natsuki and
                  Saruwatari, Hiroshi},
  title        = {Amplitude Matching: Majorization-Minimization Algorithm for Sound Field Control Only with Amplitude Constraint},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages        = {411--415},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICASSP39728.2021.9414855},
  doi          = {10.1109/ICASSP39728.2021.9414855},
  timestamp    = {Thu, 08 Jul 2021 17:12:48 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/KoyamaAUS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/KondoKTKS21,
  author       = {Kondo, Yuto and
                  Kubo, Yuki and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi},
  title        = {Deficient Basis Estimation of Noise Spatial Covariance Matrix for Rank-Constrained Spatial Covariance Matrix Estimation Method in Blind Speech Extraction},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages        = {806--810},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICASSP39728.2021.9414479},
  doi          = {10.1109/ICASSP39728.2021.9414479},
  timestamp    = {Thu, 08 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/KondoKTKS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/UedaFSTBS21,
  author       = {Yota Ueda and
                  Kazuki Fujii and
                  Yuki Saito and
                  Shinnosuke Takamichi and
                  Yukino Baba and
                  Hiroshi Saruwatari},
  title        = {{HumanACGAN}: Conditional Generative Adversarial Network with Human-Based
                  Auxiliary Classifier and its Evaluation in Phoneme Perception},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages        = {6468--6472},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICASSP39728.2021.9413363},
  doi          = {10.1109/ICASSP39728.2021.9413363},
  timestamp    = {Fri, 09 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/UedaFSTBS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/XinKTS21,
  author       = {Xin, Detai and
                  Komatsu, Tatsuya and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Disentangled Speaker and Language Representations Using Mutual Information Minimization and Domain Adaptation for Cross-Lingual {TTS}},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages        = {6608--6612},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICASSP39728.2021.9414226},
  doi          = {10.1109/ICASSP39728.2021.9414226},
  timestamp    = {Fri, 09 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/XinKTS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/NakamuraKS21,
  author       = {Taiki Nakamura and
                  Tomoki Koriyama and
                  Hiroshi Saruwatari},
  editor       = {Hynek Hermansky and
                  Honza {\v{C}}ernock{\'{y}} and
                  Luk{\'{a}}{\v{s}} Burget and
                  Lori Lamel and
                  Odette Scharenborg and
                  Petr Motl{\'{\i}}{\v{c}}ek},
  title        = {Sequence-to-Sequence Learning for Deep {Gaussian} Process Based Speech
                  Synthesis Using Self-Attention {GP} Layer},
  booktitle    = {Interspeech 2021, 22nd Annual Conference of the International Speech
                  Communication Association, Brno, Czechia, 30 August - 3 September
                  2021},
  pages        = {121--125},
  publisher    = {{ISCA}},
  year         = {2021},
  url          = {https://doi.org/10.21437/Interspeech.2021-896},
  doi          = {10.21437/INTERSPEECH.2021-896},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/NakamuraKS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/XinSTKS21,
  author       = {Detai Xin and
                  Yuki Saito and
                  Shinnosuke Takamichi and
                  Tomoki Koriyama and
                  Hiroshi Saruwatari},
  editor       = {Hynek Hermansky and
                  Honza {\v{C}}ernock{\'{y}} and
                  Luk{\'{a}}{\v{s}} Burget and
                  Lori Lamel and
                  Odette Scharenborg and
                  Petr Motl{\'{\i}}{\v{c}}ek},
  title        = {Cross-Lingual Speaker Adaptation Using Domain Adaptation and Speaker
                  Consistency Loss for Text-To-Speech Synthesis},
  booktitle    = {Interspeech 2021, 22nd Annual Conference of the International Speech
                  Communication Association, Brno, Czechia, 30 August - 3 September
                  2021},
  pages        = {1614--1618},
  publisher    = {{ISCA}},
  year         = {2021},
  url          = {https://doi.org/10.21437/Interspeech.2021-897},
  doi          = {10.21437/INTERSPEECH.2021-897},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/XinSTKS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% WaveGAN and GAN are brace-protected in the title so sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/interspeech/MizutaKS21,
  author       = {Mizuta, Kazuki and
                  Koriyama, Tomoki and
                  Saruwatari, Hiroshi},
  editor       = {Hermansky, Hynek and
                  Cernock{\'{y}}, Honza and
                  Burget, Luk{\'{a}}s and
                  Lamel, Lori and
                  Scharenborg, Odette and
                  Motl{\'{\i}}cek, Petr},
  title        = {Harmonic {WaveGAN}: {GAN}-Based Speech Waveform Generation Model with
                  Harmonic Structure Discriminator},
  booktitle    = {Interspeech 2021, 22nd Annual Conference of the International Speech
                  Communication Association, Brno, Czechia, 30 August - 3 September
                  2021},
  pages        = {2192--2196},
  publisher    = {{ISCA}},
  year         = {2021},
  url          = {https://doi.org/10.21437/Interspeech.2021-583},
  doi          = {10.21437/INTERSPEECH.2021-583},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/MizutaKS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/waspaa/HoriuchiKRUS21,
  author       = {Horiuchi, Ryosuke and
                  Koyama, Shoichi and
                  Ribeiro, Juliano G. C. and
                  Ueno, Natsuki and
                  Saruwatari, Hiroshi},
  title        = {Kernel Learning for Sound Field Estimation with {L1} and {L2} Regularizations},
  booktitle    = {{IEEE} Workshop on Applications of Signal Processing to Audio and
                  Acoustics, {WASPAA} 2021, New Paltz, NY, USA, October 17-20, 2021},
  pages        = {261--265},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/WASPAA52581.2021.9632731},
  doi          = {10.1109/WASPAA52581.2021.9632731},
  timestamp    = {Tue, 21 Dec 2021 10:11:15 +0100},
  biburl       = {https://dblp.org/rec/conf/waspaa/HoriuchiKRUS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/waspaa/KimuraKUS21,
  author       = {Kimura, Keisuke and
                  Koyama, Shoichi and
                  Ueno, Natsuki and
                  Saruwatari, Hiroshi},
  title        = {Mean-Square-Error-Based Secondary Source Placement in Sound Field
                  Synthesis with Prior Information on Desired Field},
  booktitle    = {{IEEE} Workshop on Applications of Signal Processing to Audio and
                  Acoustics, {WASPAA} 2021, New Paltz, NY, USA, October 17-20, 2021},
  pages        = {281--285},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/WASPAA52581.2021.9632799},
  doi          = {10.1109/WASPAA52581.2021.9632799},
  timestamp    = {Tue, 21 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/waspaa/KimuraKUS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% HumanACGAN is brace-protected in the title so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2102-04051,
  author       = {Ueda, Yota and
                  Fujii, Kazuki and
                  Saito, Yuki and
                  Takamichi, Shinnosuke and
                  Baba, Yukino and
                  Saruwatari, Hiroshi},
  title        = {{HumanACGAN}: conditional generative adversarial network with human-based
                  auxiliary classifier and its evaluation in phoneme perception},
  journal      = {CoRR},
  volume       = {abs/2102.04051},
  year         = {2021},
  url          = {https://arxiv.org/abs/2102.04051},
  eprinttype   = {arXiv},
  eprint       = {2102.04051},
  timestamp    = {Wed, 10 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2102-04051.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-02491,
  author       = {Kondo, Yuto and
                  Kubo, Yuki and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi},
  title        = {Deficient Basis Estimation of Noise Spatial Covariance Matrix for
                  Rank-Constrained Spatial Covariance Matrix Estimation Method in Blind
                  Speech Extraction},
  journal      = {CoRR},
  volume       = {abs/2105.02491},
  year         = {2021},
  url          = {https://arxiv.org/abs/2105.02491},
  eprinttype   = {arXiv},
  eprint       = {2105.02491},
  timestamp    = {Wed, 12 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-02491.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-04079,
  author       = {Saito, Koichi and
                  Nakamura, Tomohiko and
                  Yatabe, Kohei and
                  Koizumi, Yuma and
                  Saruwatari, Hiroshi},
  title        = {Sampling-Frequency-Independent Audio Source Separation Using Convolution
                  Layer Based on Impulse Invariant Method},
  journal      = {CoRR},
  volume       = {abs/2105.04079},
  year         = {2021},
  url          = {https://arxiv.org/abs/2105.04079},
  eprinttype   = {arXiv},
  eprint       = {2105.04079},
  timestamp    = {Fri, 14 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-04079.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Bayesian is brace-protected in the title so sentence-casing styles keep the proper adjective capitalised.
@article{DBLP:journals/corr/abs-2106-03492,
  author       = {Hasumi, Takuya and
                  Nakamura, Tomohiko and
                  Takamune, Norihiro and
                  Saruwatari, Hiroshi and
                  Kitamura, Daichi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {Empirical {Bayesian} Independent Deeply Learned Matrix Analysis For
                  Multichannel Audio Source Separation},
  journal      = {CoRR},
  volume       = {abs/2106.03492},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.03492},
  eprinttype   = {arXiv},
  eprint       = {2106.03492},
  timestamp    = {Thu, 10 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-03492.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-05529,
  author       = {Narisawa, Naoki and
                  Ikeshita, Rintaro and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Nakamura, Tomohiko and
                  Saruwatari, Hiroshi and
                  Nakatani, Tomohiro},
  title        = {Independent Deeply Learned Tensor Analysis for Determined Audio Source
                  Separation},
  journal      = {CoRR},
  volume       = {abs/2106.05529},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.05529},
  eprinttype   = {arXiv},
  eprint       = {2106.05529},
  timestamp    = {Tue, 15 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-05529.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-00237,
  author       = {Mizobuchi, Yusaku and
                  Kitamura, Daichi and
                  Nakamura, Tomohiko and
                  Saruwatari, Hiroshi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {Prior Distribution Design for Music Bleeding-Sound Reduction Based
                  on Nonnegative Matrix Factorization},
  journal      = {CoRR},
  volume       = {abs/2109.00237},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.00237},
  eprinttype   = {arXiv},
  eprint       = {2109.00237},
  timestamp    = {Mon, 20 Sep 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-00237.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-00704,
  author       = {Hasumi, Takuya and
                  Nakamura, Tomohiko and
                  Takamune, Norihiro and
                  Saruwatari, Hiroshi and
                  Kitamura, Daichi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {Multichannel Audio Source Separation with Independent Deeply Learned
                  Matrix Analysis Using Product of Source Models},
  journal      = {CoRR},
  volume       = {abs/2109.00704},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.00704},
  eprinttype   = {arXiv},
  eprint       = {2109.00704},
  timestamp    = {Mon, 20 Sep 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-00704.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-04658,
  author       = {Misawa, Sota and
                  Takamune, Norihiro and
                  Nakamura, Tomohiko and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Une, Masakazu and
                  Makino, Shoji},
  title        = {Speech Enhancement by Noise Self-Supervised Rank-Constrained Spatial
                  Covariance Matrix Estimation via Independent Deeply Learned Matrix
                  Analysis},
  journal      = {CoRR},
  volume       = {abs/2109.04658},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.04658},
  eprinttype   = {arXiv},
  eprint       = {2109.04658},
  timestamp    = {Tue, 21 Sep 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-04658.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-07274,
  author       = {Iijima, Naoto and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Binaural rendering from microphone array signals of arbitrary geometry},
  journal      = {CoRR},
  volume       = {abs/2109.07274},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.07274},
  eprinttype   = {arXiv},
  eprint       = {2109.07274},
  timestamp    = {Wed, 22 Sep 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-07274.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-10724,
  author       = {Saeki, Takaaki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Low-Latency Incremental Text-to-Speech Synthesis with Distilled Context
                  Prediction Network},
  journal      = {CoRR},
  volume       = {abs/2109.10724},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.10724},
  eprinttype   = {arXiv},
  eprint       = {2109.10724},
  timestamp    = {Mon, 27 Sep 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-10724.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2110-04972,
  author       = {Horiuchi, Ryosuke and
                  Koyama, Shoichi and
                  Ribeiro, Juliano G. C. and
                  Ueno, Natsuki and
                  Saruwatari, Hiroshi},
  title        = {Kernel Learning For Sound Field Estimation With {L1} and {L2} Regularizations},
  journal      = {CoRR},
  volume       = {abs/2110.04972},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.04972},
  eprinttype   = {arXiv},
  eprint       = {2110.04972},
  timestamp    = {Thu, 21 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-04972.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2112-06774,
  author       = {Kimura, Keisuke and
                  Koyama, Shoichi and
                  Ueno, Natsuki and
                  Saruwatari, Hiroshi},
  title        = {Mean-square-error-based secondary source placement in sound field
                  synthesis with prior information on desired field},
  journal      = {CoRR},
  volume       = {abs/2112.06774},
  year         = {2021},
  url          = {https://arxiv.org/abs/2112.06774},
  eprinttype   = {arXiv},
  eprint       = {2112.06774},
  timestamp    = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2112-06774.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% url uses the DOI resolver: the former search.ieice.org link was plain http and carried backslash-escaped underscores that break in url-aware styles.
@article{DBLP:journals/ieicet/TamaruSTKS20,
  author       = {Tamaru, Hiroki and
                  Saito, Yuki and
                  Takamichi, Shinnosuke and
                  Koriyama, Tomoki and
                  Saruwatari, Hiroshi},
  title        = {Generative Moment Matching Network-Based Neural Double-Tracking for
                  Synthesized and Natural Singing Voices},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {103-D},
  number       = {3},
  pages        = {639--647},
  year         = {2020},
  url          = {https://doi.org/10.1587/transinf.2019EDP7228},
  doi          = {10.1587/TRANSINF.2019EDP7228},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ieicet/TamaruSTKS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% DNN is brace-protected in the title, like GMM, so sentence-casing styles keep the acronym upper-case.
@article{DBLP:journals/ieicetd/KoguchiTMSS20,
  author       = {Koguchi, Junya and
                  Takamichi, Shinnosuke and
                  Morise, Masanori and
                  Saruwatari, Hiroshi and
                  Sagayama, Shigeki},
  title        = {{DNN}-Based Full-Band Speech Synthesis Using {GMM} Approximation of
                  Spectral Envelope},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {103-D},
  number       = {12},
  pages        = {2673--2681},
  year         = {2020},
  url          = {https://doi.org/10.1587/transinf.2020EDP7075},
  doi          = {10.1587/TRANSINF.2020EDP7075},
  timestamp    = {Mon, 18 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ieicetd/KoguchiTMSS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/sigpro/TakamichiSTKS20,
  author       = {Takamichi, Shinnosuke and
                  Saito, Yuki and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi},
  title        = {Phase reconstruction from amplitude spectrograms based on directional-statistics
                  deep neural networks},
  journal      = {Signal Process.},
  volume       = {169},
  pages        = {107368},
  year         = {2020},
  url          = {https://doi.org/10.1016/j.sigpro.2019.107368},
  doi          = {10.1016/J.SIGPRO.2019.107368},
  timestamp    = {Fri, 14 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/sigpro/TakamichiSTKS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/sigpro/TakidaKUS20,
  author       = {Takida, Yuhta and
                  Koyama, Shoichi and
                  Ueno, Natsuki and
                  Saruwatari, Hiroshi},
  title        = {Reciprocity gap functional in spherical harmonic domain for gridless
                  sound field decomposition},
  journal      = {Signal Process.},
  volume       = {169},
  pages        = {107383},
  year         = {2020},
  url          = {https://doi.org/10.1016/j.sigpro.2019.107383},
  doi          = {10.1016/J.SIGPRO.2019.107383},
  timestamp    = {Fri, 14 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/sigpro/TakidaKUS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/speech/AsoTTS20,
  author       = {Aso, Masashi and
                  Takamichi, Shinnosuke and
                  Takamune, Norihiro and
                  Saruwatari, Hiroshi},
  title        = {Acoustic model-based subword tokenization and prosodic-context extraction
                  without language knowledge for text-to-speech synthesis},
  journal      = {Speech Commun.},
  volume       = {125},
  pages        = {53--60},
  year         = {2020},
  url          = {https://doi.org/10.1016/j.specom.2020.09.003},
  doi          = {10.1016/J.SPECOM.2020.09.003},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/speech/AsoTTS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/MitsufujiUTKKS20,
  author       = {Mitsufuji, Yuki and
                  Uhlich, Stefan and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Multichannel Non-Negative Matrix Factorization Using Banded Spatial
                  Covariance Matrices in Wavenumber Domain},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {28},
  pages        = {49--60},
  year         = {2020},
  url          = {https://doi.org/10.1109/TASLP.2019.2948770},
  doi          = {10.1109/TASLP.2019.2948770},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/MitsufujiUTKKS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Gaussian is brace-protected in the title so sentence-casing styles keep the proper adjective capitalised.
@article{DBLP:journals/taslp/MogamiTKSTKO20,
  author       = {Mogami, Shinichi and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Takahashi, Yu and
                  Kondo, Kazunobu and
                  Ono, Nobutaka},
  title        = {Independent Low-Rank Matrix Analysis Based on Time-Variant Sub-{Gaussian}
                  Source Model for Determined Blind Source Separation},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {28},
  pages        = {503--518},
  year         = {2020},
  url          = {https://doi.org/10.1109/TASLP.2019.2959257},
  doi          = {10.1109/TASLP.2019.2959257},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/MogamiTKSTKO20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Gaussian is brace-protected in the title so sentence-casing styles keep the proper adjective capitalised.
@article{DBLP:journals/taslp/KuboTKS20,
  author       = {Kubo, Yuki and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi},
  title        = {Blind Speech Extraction Based on Rank-Constrained Spatial Covariance
                  Matrix Estimation With Multivariate Generalized {Gaussian} Distribution},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {28},
  pages        = {1948--1963},
  year         = {2020},
  url          = {https://doi.org/10.1109/TASLP.2020.3003165},
  doi          = {10.1109/TASLP.2020.3003165},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/KuboTKS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Student is brace-protected in the title so sentence-casing styles keep the proper name capitalised.
@inproceedings{DBLP:conf/apsipa/KamoKTKSTK20,
  author       = {Kamo, Keigo and
                  Kubo, Yuki and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {Joint-Diagonalizability-Constrained Multichannel Nonnegative Matrix
                  Factorization Based on Multivariate Complex {Student}'s t-distribution},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} 2020, Auckland, New Zealand, December
                  7-10, 2020},
  pages        = {869--874},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://ieeexplore.ieee.org/document/9306489},
  timestamp    = {Thu, 11 Feb 2021 11:44:30 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/KamoKTKSTK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% DNN is brace-protected in the title so sentence-casing styles keep the acronym upper-case.
@inproceedings{DBLP:conf/eusipco/WatanabeKSTK20,
  author       = {Watanabe, Rui and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {{DNN}-Based Frequency Component Prediction for Frequency-Domain Audio
                  Source Separation},
  booktitle    = {28th European Signal Processing Conference, {EUSIPCO} 2020, Amsterdam,
                  Netherlands, January 18-21, 2021},
  pages        = {805--809},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.23919/Eusipco47968.2020.9287225},
  doi          = {10.23919/EUSIPCO47968.2020.9287225},
  timestamp    = {Fri, 08 Jan 2021 16:18:38 +0100},
  biburl       = {https://dblp.org/rec/conf/eusipco/WatanabeKSTK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Gaussian is brace-protected in the title so sentence-casing styles keep the proper adjective capitalised.
@inproceedings{DBLP:conf/eusipco/KamoKTKSTK20,
  author       = {Kamo, Keigo and
                  Kubo, Yuki and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {Joint-Diagonalizability-Constrained Multichannel Nonnegative Matrix
                  Factorization Based on Multivariate Complex Sub-{Gaussian} Distribution},
  booktitle    = {28th European Signal Processing Conference, {EUSIPCO} 2020, Amsterdam,
                  Netherlands, January 18-21, 2021},
  pages        = {890--894},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.23919/Eusipco47968.2020.9287572},
  doi          = {10.23919/EUSIPCO47968.2020.9287572},
  timestamp    = {Fri, 08 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eusipco/KamoKTKSTK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Gaussian is brace-protected in the title so sentence-casing styles keep the proper adjective capitalised.
@inproceedings{DBLP:conf/eusipco/NishidaUKS20,
  author       = {Nishida, Tomoya and
                  Ueno, Natsuki and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Sensor placement in arbitrarily restricted region for field estimation
                  based on {Gaussian} process},
  booktitle    = {28th European Signal Processing Conference, {EUSIPCO} 2020, Amsterdam,
                  Netherlands, January 18-21, 2021},
  pages        = {2289--2293},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.23919/Eusipco47968.2020.9287222},
  doi          = {10.23919/EUSIPCO47968.2020.9287222},
  timestamp    = {Fri, 08 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eusipco/NishidaUKS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ArigaNKUS20,
  author       = {Ariga, Kentaro and
                  Nishida, Tomoya and
                  Koyama, Shoichi and
                  Ueno, Natsuki and
                  Saruwatari, Hiroshi},
  title        = {Mutual-Information-Based Sensor Placement for Spatial Sound Field
                  Recording},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {166--170},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9053715},
  doi          = {10.1109/ICASSP40776.2020.9053715},
  timestamp    = {Thu, 23 Jul 2020 16:19:28 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ArigaNKUS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Wave-U-Net is brace-protected in the title so sentence-casing styles keep the model name intact.
@inproceedings{DBLP:conf/icassp/NakamuraS20,
  author       = {Nakamura, Tomohiko and
                  Saruwatari, Hiroshi},
  title        = {Time-Domain Audio Source Separation Based on {Wave-U-Net} Combined with
                  Discrete Wavelet Transform},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {386--390},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9053934},
  doi          = {10.1109/ICASSP40776.2020.9053934},
  timestamp    = {Sat, 05 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/NakamuraS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ILRMA is brace-protected in the title so sentence-casing styles keep the acronym upper-case.
@inproceedings{DBLP:conf/icassp/KamoKTKSTK20,
  author       = {Kamo, Keigo and
                  Kubo, Yuki and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {Regularized Fast Multichannel Nonnegative Matrix Factorization with
                  {ILRMA}-Based Prior Distribution of Joint-Diagonalization Process},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {606--610},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9054603},
  doi          = {10.1109/ICASSP40776.2020.9054603},
  timestamp    = {Thu, 23 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/KamoKTKSTK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Student is brace-protected in the title so sentence-casing styles keep the proper name capitalised.
@inproceedings{DBLP:conf/icassp/KondoFTKSIN20,
  author       = {Kondo, Tatsuki and
                  Fukushige, Kanta and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Ikeshita, Rintaro and
                  Nakatani, Tomohiro},
  title        = {Convergence-Guaranteed Independent Positive Semidefinite Tensor Analysis
                  Based on {Student}'s {T} Distribution},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {681--685},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9054150},
  doi          = {10.1109/ICASSP40776.2020.9054150},
  timestamp    = {Thu, 23 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/KondoFTKSIN20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The model name was flattened to Humangan by title-casing; it is restored as HumanGAN and brace-protected.
@inproceedings{DBLP:conf/icassp/FujiiSTBS20,
  author       = {Fujii, Kazuki and
                  Saito, Yuki and
                  Takamichi, Shinnosuke and
                  Baba, Yukino and
                  Saruwatari, Hiroshi},
  title        = {{HumanGAN}: Generative Adversarial Network With Human-Based Discriminator
                  And Its Evaluation In Speech Perception Modeling},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {6239--6243},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9053844},
  doi          = {10.1109/ICASSP40776.2020.9053844},
  timestamp    = {Tue, 29 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/FujiiSTBS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Gaussian is brace-protected in the title so sentence-casing styles keep the proper adjective capitalised.
@inproceedings{DBLP:conf/icassp/KoriyamaS20,
  author       = {Koriyama, Tomoki and
                  Saruwatari, Hiroshi},
  title        = {Utterance-Level Sequential Modeling for Deep {Gaussian} Process Based
                  Speech Synthesis Using Simple Recurrent Unit},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {7249--7253},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9052935},
  doi          = {10.1109/ICASSP40776.2020.9052935},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/KoriyamaS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaekiSTS20,
  author       = {Saeki, Takaaki and
                  Saito, Yuki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Lifter Training and Sub-Band Modeling for Computationally Efficient
                  and High-Quality Voice Conversion Using Spectral Differentials},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {7784--7788},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9054490},
  doi          = {10.1109/ICASSP40776.2020.9054490},
  timestamp    = {Tue, 29 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/SaekiSTS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ItoKUS20,
  author       = {Ito, Hayato and
                  Koyama, Shoichi and
                  Ueno, Natsuki and
                  Saruwatari, Hiroshi},
  title        = {Spatial Active Noise Control Based on Kernel Interpolation with Directional
                  Weighting},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {8404--8408},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9053416},
  doi          = {10.1109/ICASSP40776.2020.9053416},
  timestamp    = {Thu, 23 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ItoKUS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ieeesam/RibeiroUKS20,
  author       = {Ribeiro, Juliano G. C. and
                  Ueno, Natsuki and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Kernel interpolation of acoustic transfer function between regions
                  considering reciprocity},
  booktitle    = {11th {IEEE} Sensor Array and Multichannel Signal Processing Workshop,
                  {SAM} 2020, Hangzhou, China, June 8-11, 2020},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/SAM48682.2020.9104256},
  doi          = {10.1109/SAM48682.2020.9104256},
  timestamp    = {Tue, 15 Jun 2021 19:37:23 +0200},
  biburl       = {https://dblp.org/rec/conf/ieeesam/RibeiroUKS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/TakeuchiKOS20,
  author       = {Takeuchi, Hirotoshi and
                  Kashino, Kunio and
                  Ohishi, Yasunori and
                  Saruwatari, Hiroshi},
  editor       = {Meng, Helen and
                  Xu, Bo and
                  Zheng, Thomas Fang},
  title        = {Harmonic Lowering for Accelerating Harmonic Convolution for Audio
                  Signals},
  booktitle    = {Interspeech 2020, 21st Annual Conference of the International Speech
                  Communication Association, Virtual Event, Shanghai, China, 25-29 October
                  2020},
  pages        = {185--189},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://doi.org/10.21437/Interspeech.2020-3185},
  doi          = {10.21437/INTERSPEECH.2020-3185},
  timestamp    = {Fri, 29 Jan 2021 17:40:16 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/TakeuchiKOS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaekiSTS20,
  author       = {Takaaki Saeki and
                  Yuki Saito and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  editor       = {Helen Meng and
                  Bo Xu and
                  Thomas Fang Zheng},
  title        = {Real-Time, Full-Band, Online {DNN}-Based Voice Conversion System Using
                  a Single {CPU}},
  booktitle    = {Interspeech 2020, 21st Annual Conference of the International Speech
                  Communication Association, Virtual Event, Shanghai, China, 25-29 October
                  2020},
  pages        = {1021--1022},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://www.isca-speech.org/archive/interspeech\_2020/saeki20\_interspeech.html},
  timestamp    = {Tue, 27 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SaekiSTS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/MitsuiKS20,
  author       = {Kentaro Mitsui and
                  Tomoki Koriyama and
                  Hiroshi Saruwatari},
  editor       = {Helen Meng and
                  Bo Xu and
                  Thomas Fang Zheng},
  title        = {Multi-Speaker Text-to-Speech Synthesis Using Deep {Gaussian} Processes},
  booktitle    = {Interspeech 2020, 21st Annual Conference of the International Speech
                  Communication Association, Virtual Event, Shanghai, China, 25-29 October
                  2020},
  pages        = {2032--2036},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://doi.org/10.21437/Interspeech.2020-3167},
  doi          = {10.21437/INTERSPEECH.2020-3167},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/MitsuiKS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/XinSTKS20,
  author       = {Xin, Detai and
                  Saito, Yuki and
                  Takamichi, Shinnosuke and
                  Koriyama, Tomoki and
                  Saruwatari, Hiroshi},
  editor       = {Meng, Helen and
                  Xu, Bo and
                  Zheng, Thomas Fang},
  title        = {Cross-Lingual Text-To-Speech Synthesis via Domain Adaptation and Perceptual Similarity Regression in Speaker Space},
  booktitle    = {Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020},
  pages        = {2947--2951},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://doi.org/10.21437/Interspeech.2020-2070},
  doi          = {10.21437/INTERSPEECH.2020-2070},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/XinSTKS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/YamashitaKSTIMS20,
  author       = {Yuki Yamashita and
                  Tomoki Koriyama and
                  Yuki Saito and
                  Shinnosuke Takamichi and
                  Yusuke Ijima and
                  Ryo Masumura and
                  Hiroshi Saruwatari},
  editor       = {Helen Meng and
                  Bo Xu and
                  Thomas Fang Zheng},
  title        = {Investigating Effective Additional Contextual Factors in {DNN}-Based
                  Spontaneous Speech Synthesis},
  booktitle    = {Interspeech 2020, 21st Annual Conference of the International Speech
                  Communication Association, Virtual Event, Shanghai, China, 25-29 October
                  2020},
  pages        = {3201--3205},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://doi.org/10.21437/Interspeech.2020-2469},
  doi          = {10.21437/INTERSPEECH.2020-2469},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/YamashitaKSTIMS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/AsoTS20,
  author       = {Aso, Masashi and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  editor       = {Meng, Helen and
                  Xu, Bo and
                  Zheng, Thomas Fang},
  title        = {End-to-End Text-to-Speech Synthesis with Unaligned Multiple Language Units Based on Attention},
  booktitle    = {Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020},
  pages        = {4009--4013},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://doi.org/10.21437/Interspeech.2020-2347},
  doi          = {10.21437/INTERSPEECH.2020-2347},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/AsoTS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lrec/YamashitaKSTIMS20,
  author       = {Yuki Yamashita and
                  Tomoki Koriyama and
                  Yuki Saito and
                  Shinnosuke Takamichi and
                  Yusuke Ijima and
                  Ryo Masumura and
                  Hiroshi Saruwatari},
  editor       = {Nicoletta Calzolari and
                  Fr{\'{e}}d{\'{e}}ric B{\'{e}}chet and
                  Philippe Blache and
                  Khalid Choukri and
                  Christopher Cieri and
                  Thierry Declerck and
                  Sara Goggi and
                  Hitoshi Isahara and
                  Bente Maegaard and
                  Joseph Mariani and
                  H{\'{e}}l{\`{e}}ne Mazo and
                  Asunci{\'{o}}n Moreno and
                  Jan Odijk and
                  Stelios Piperidis},
  title        = {{DNN}-based Speech Synthesis Using Abundant Tags of Spontaneous Speech
                  Corpus},
  booktitle    = {Proceedings of The 12th Language Resources and Evaluation Conference,
                  {LREC} 2020, Marseille, France, May 11-16, 2020},
  pages        = {6438--6443},
  publisher    = {European Language Resources Association},
  year         = {2020},
  url          = {https://aclanthology.org/2020.lrec-1.792/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/lrec/YamashitaKSTIMS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lrec/SaitoTS20,
  author       = {Saito, Yuki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  editor       = {Calzolari, Nicoletta and
                  B{\'{e}}chet, Fr{\'{e}}d{\'{e}}ric and
                  Blache, Philippe and
                  Choukri, Khalid and
                  Cieri, Christopher and
                  Declerck, Thierry and
                  Goggi, Sara and
                  Isahara, Hitoshi and
                  Maegaard, Bente and
                  Mariani, Joseph and
                  Mazo, H{\'{e}}l{\`{e}}ne and
                  Moreno, Asunci{\'{o}}n and
                  Odijk, Jan and
                  Piperidis, Stelios},
  title        = {{SMASH} Corpus: {A} Spontaneous Speech Corpus Recording Third-person Audio Commentaries on Gameplay},
  booktitle    = {Proceedings of The 12th Language Resources and Evaluation Conference, {LREC} 2020, Marseille, France, May 11-16, 2020},
  pages        = {6571--6577},
  publisher    = {European Language Resources Association},
  year         = {2020},
  url          = {https://aclanthology.org/2020.lrec-1.809/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/lrec/SaitoTS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mmsp/IijimaKS20,
  author       = {Iijima, Naoto and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Binaural Rendering From Distributed Microphone Signals Considering Loudspeaker Distance in Measurements},
  booktitle    = {22nd {IEEE} International Workshop on Multimedia Signal Processing, {MMSP} 2020, Tampere, Finland, September 21-24, 2020},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/MMSP48831.2020.9287157},
  doi          = {10.1109/MMSP48831.2020.9287157},
  timestamp    = {Wed, 13 Jan 2021 17:58:36 +0100},
  biburl       = {https://dblp.org/rec/conf/mmsp/IijimaKS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2001-07044,
  author       = {Hiroki Tamaru and
                  Shinnosuke Takamichi and
                  Naoko Tanji and
                  Hiroshi Saruwatari},
  title        = {{JVS-MuSiC}: {Japanese} multispeaker singing-voice corpus},
  journal      = {CoRR},
  volume       = {abs/2001.07044},
  year         = {2020},
  url          = {https://arxiv.org/abs/2001.07044},
  eprinttype   = {arXiv},
  eprint       = {2001.07044},
  timestamp    = {Fri, 24 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2001-07044.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2001-10190,
  author       = {Tomohiko Nakamura and
                  Hiroshi Saruwatari},
  title        = {Time-Domain Audio Source Separation Based on {Wave-U-Net} Combined with
                  Discrete Wavelet Transform},
  journal      = {CoRR},
  volume       = {abs/2001.10190},
  year         = {2020},
  url          = {https://arxiv.org/abs/2001.10190},
  eprinttype   = {arXiv},
  eprint       = {2001.10190},
  timestamp    = {Thu, 30 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2001-10190.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-00579,
  author       = {Keigo Kamo and
                  Yuki Kubo and
                  Norihiro Takamune and
                  Daichi Kitamura and
                  Hiroshi Saruwatari and
                  Yu Takahashi and
                  Kazunobu Kondo},
  title        = {Regularized Fast Multichannel Nonnegative Matrix Factorization with
                  {ILRMA}-based Prior Distribution of Joint-Diagonalization Process},
  journal      = {CoRR},
  volume       = {abs/2002.00579},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.00579},
  eprinttype   = {arXiv},
  eprint       = {2002.00579},
  timestamp    = {Mon, 10 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-00579.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-06778,
  author       = {Saeki, Takaaki and
                  Saito, Yuki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Lifter Training and Sub-band Modeling for Computationally Efficient and High-Quality Voice Conversion Using Spectral Differentials},
  journal      = {CoRR},
  volume       = {abs/2002.06778},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.06778},
  eprinttype   = {arXiv},
  eprint       = {2002.06778},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-06778.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-08582,
  author       = {Tatsuki Kondo and
                  Kanta Fukushige and
                  Norihiro Takamune and
                  Daichi Kitamura and
                  Hiroshi Saruwatari and
                  Rintaro Ikeshita and
                  Tomohiro Nakatani},
  title        = {Convergence-guaranteed Independent Positive Semidefinite Tensor Analysis
                  Based on {Student's} t Distribution},
  journal      = {CoRR},
  volume       = {abs/2002.08582},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.08582},
  eprinttype   = {arXiv},
  eprint       = {2002.08582},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-08582.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-10823,
  author       = {Tomoki Koriyama and
                  Hiroshi Saruwatari},
  title        = {Utterance-level Sequential Modeling For Deep {Gaussian} Process Based
                  Speech Synthesis Using Simple Recurrent Unit},
  journal      = {CoRR},
  volume       = {abs/2004.10823},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.10823},
  eprinttype   = {arXiv},
  eprint       = {2004.10823},
  timestamp    = {Wed, 29 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-10823.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-00416,
  author       = {Keigo Kamo and
                  Yuki Kubo and
                  Norihiro Takamune and
                  Daichi Kitamura and
                  Hiroshi Saruwatari and
                  Yu Takahashi and
                  Kazunobu Kondo},
  title        = {Joint-Diagonalizability-Constrained Multichannel Nonnegative Matrix
                  Factorization Based on Multivariate Complex Sub-{Gaussian} Distribution},
  journal      = {CoRR},
  volume       = {abs/2007.00416},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.00416},
  eprinttype   = {arXiv},
  eprint       = {2007.00416},
  timestamp    = {Mon, 06 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-00416.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-02950,
  author       = {Kentaro Mitsui and
                  Tomoki Koriyama and
                  Hiroshi Saruwatari},
  title        = {Multi-speaker Text-to-speech Synthesis Using Deep {Gaussian} Processes},
  journal      = {CoRR},
  volume       = {abs/2008.02950},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.02950},
  eprinttype   = {arXiv},
  eprint       = {2008.02950},
  timestamp    = {Mon, 17 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-02950.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-01793,
  author       = {Shinnosuke Takamichi and
                  Mamoru Komachi and
                  Naoko Tanji and
                  Hiroshi Saruwatari},
  title        = {{JSSS:} free {Japanese} speech corpus for summarization and simplification},
  journal      = {CoRR},
  volume       = {abs/2010.01793},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.01793},
  eprinttype   = {arXiv},
  eprint       = {2010.01793},
  timestamp    = {Tue, 13 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-01793.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2012-12612,
  author       = {Saeki, Takaaki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Incremental Text-to-Speech Synthesis Using Pseudo Lookahead with Large Pretrained Language Model},
  journal      = {CoRR},
  volume       = {abs/2012.12612},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.12612},
  eprinttype   = {arXiv},
  eprint       = {2012.12612},
  timestamp    = {Tue, 05 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-12612.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/csl/SaitoTS19,
  author       = {Saito, Yuki and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi},
  title        = {Vocoder-free text-to-speech synthesis incorporating generative adversarial networks using low-/multi-frequency {STFT} amplitude spectra},
  journal      = {Comput. Speech Lang.},
  volume       = {58},
  pages        = {347--363},
  year         = {2019},
  url          = {https://doi.org/10.1016/j.csl.2019.05.008},
  doi          = {10.1016/J.CSL.2019.05.008},
  timestamp    = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/csl/SaitoTS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/MogamiMTKSTKNK19,
  author       = {Shinichi Mogami and
                  Yoshiki Mitsui and
                  Norihiro Takamune and
                  Daichi Kitamura and
                  Hiroshi Saruwatari and
                  Yu Takahashi and
                  Kazunobu Kondo and
                  Hiroaki Nakajima and
                  Hirokazu Kameoka},
  title        = {Independent Low-Rank Matrix Analysis Based on Generalized {Kullback-Leibler}
                  Divergence},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {102-A},
  number       = {2},
  pages        = {458--463},
  year         = {2019},
  url          = {https://doi.org/10.1587/transfun.E102.A.458},
  doi          = {10.1587/TRANSFUN.E102.A.458},
  timestamp    = {Mon, 18 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ieicet/MogamiMTKSTKNK19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/SekizawaTS19,
  author       = {Daiki Sekizawa and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  title        = {Prosody Correction Preserving Speaker Individuality for {Chinese}-Accented
                  {Japanese} {HMM}-Based Text-to-Speech Synthesis},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {102-D},
  number       = {6},
  pages        = {1218--1221},
  year         = {2019},
  url          = {https://doi.org/10.1587/transinf.2018EDL8264},
  doi          = {10.1587/TRANSINF.2018EDL8264},
  timestamp    = {Mon, 18 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ieicet/SekizawaTS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/spl/NakajimaKTSO19,
  author       = {Nakajima, Hiroaki and
                  Kitamura, Daichi and
                  Takamune, Norihiro and
                  Saruwatari, Hiroshi and
                  Ono, Nobutaka},
  title        = {Bilevel Optimization Using Stationary Point of Lower-Level Objective Function for Discriminative Basis Learning in Nonnegative Matrix Factorization},
  journal      = {{IEEE} Signal Process. Lett.},
  volume       = {26},
  number       = {6},
  pages        = {818--822},
  year         = {2019},
  url          = {https://doi.org/10.1109/LSP.2019.2909079},
  doi          = {10.1109/LSP.2019.2909079},
  timestamp    = {Fri, 27 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/spl/NakajimaKTSO19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/MakishimaMTKSTS19,
  author       = {Makishima, Naoki and
                  Mogami, Shinichi and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Sumino, Hayato and
                  Takamichi, Shinnosuke and
                  Saruwatari, Hiroshi and
                  Ono, Nobutaka},
  title        = {Independent Deeply Learned Matrix Analysis for Determined Audio Source Separation},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {27},
  number       = {10},
  pages        = {1601--1615},
  year         = {2019},
  url          = {https://doi.org/10.1109/TASLP.2019.2925450},
  doi          = {10.1109/TASLP.2019.2925450},
  timestamp    = {Fri, 27 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/MakishimaMTKSTS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/UenoKS19,
  author       = {Ueno, Natsuki and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Three-Dimensional Sound Field Reproduction Based on Weighted Mode-Matching Method},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {27},
  number       = {12},
  pages        = {1852--1867},
  year         = {2019},
  url          = {https://doi.org/10.1109/TASLP.2019.2934834},
  doi          = {10.1109/TASLP.2019.2934834},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/UenoKS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/KuboTKS19,
  author       = {Kubo, Yuki and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi},
  title        = {Acceleration of rank-constrained spatial covariance matrix estimation for blind speech extraction},
  booktitle    = {2019 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} {ASC} 2019, Lanzhou, China, November 18-21, 2019},
  pages        = {332--338},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/APSIPAASC47483.2019.9023281},
  doi          = {10.1109/APSIPAASC47483.2019.9023281},
  timestamp    = {Fri, 13 Mar 2020 10:17:58 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/KuboTKS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/MakishimaTSKTK19,
  author       = {Makishima, Naoki and
                  Takamune, Norihiro and
                  Saruwatari, Hiroshi and
                  Kitamura, Daichi and
                  Takahashi, Yu and
                  Kondo, Kazunobu},
  title        = {Robust Demixing Filter Update Algorithm Based on Microphone-wise Coordinate Descent for Independent Deeply Learned Matrix Analysis},
  booktitle    = {2019 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} {ASC} 2019, Lanzhou, China, November 18-21, 2019},
  pages        = {1868--1873},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/APSIPAASC47483.2019.9023032},
  doi          = {10.1109/APSIPAASC47483.2019.9023032},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/MakishimaTSKTK19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/UneKTKSM19,
  author       = {Une, Masakazu and
                  Kubo, Yuki and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi and
                  Makino, Shoji},
  title        = {Evaluation of Multichannel Hearing Aid System by Rank-Constrained Spatial Covariance Matrix Estimation},
  booktitle    = {2019 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} {ASC} 2019, Lanzhou, China, November 18-21, 2019},
  pages        = {1874--1879},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/APSIPAASC47483.2019.9023081},
  doi          = {10.1109/APSIPAASC47483.2019.9023081},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/UneKTKSM19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/KuboTKS19,
  author       = {Kubo, Yuki and
                  Takamune, Norihiro and
                  Kitamura, Daichi and
                  Saruwatari, Hiroshi},
  title        = {Efficient Full-Rank Spatial Covariance Estimation Using Independent Low-Rank Matrix Analysis for Blind Source Separation},
  booktitle    = {27th European Signal Processing Conference, {EUSIPCO} 2019, {A} Coru{\~{n}}a, Spain, September 2-6, 2019},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.23919/EUSIPCO.2019.8903026},
  doi          = {10.23919/EUSIPCO.2019.8903026},
  timestamp    = {Mon, 25 Nov 2019 12:04:51 +0100},
  biburl       = {https://dblp.org/rec/conf/eusipco/KuboTKS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ItoKUS19,
  author       = {Ito, Hayato and
                  Koyama, Shoichi and
                  Ueno, Natsuki and
                  Saruwatari, Hiroshi},
  title        = {Feedforward Spatial Active Noise Control Based on Kernel Interpolation of Sound Field},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages        = {511--515},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICASSP.2019.8683067},
  doi          = {10.1109/ICASSP.2019.8683067},
  timestamp    = {Fri, 27 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/ItoKUS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/TakidaKUS19,
  author       = {Takida, Yuhta and
                  Koyama, Shoichi and
                  Ueno, Natsuki and
                  Saruwatari, Hiroshi},
  title        = {Robust Gridless Sound Field Decomposition Based on Structured Reciprocity Gap Functional in Spherical Harmonic Domain},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages        = {581--585},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICASSP.2019.8683310},
  doi          = {10.1109/ICASSP.2019.8683310},
  timestamp    = {Fri, 27 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/TakidaKUS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/TamaruSTKS19,
  author       = {Hiroki Tamaru and
                  Yuki Saito and
                  Shinnosuke Takamichi and
                  Tomoki Koriyama and
                  Hiroshi Saruwatari},
  title        = {Generative Moment Matching Network-based Random Modulation Post-filter
                  for {DNN}-based Singing Voice Synthesis and Neural Double-tracking},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages        = {7070--7074},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICASSP.2019.8683476},
  doi          = {10.1109/ICASSP.2019.8683476},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/TamaruSTKS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/uist/ArakawaTS19,
  author       = {Riku Arakawa and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  editor       = {Fran{\c{c}}ois Guimbreti{\`{e}}re and
                  Michael S. Bernstein and
                  Katharina Reinecke},
  title        = {{TransVoice}: Real-Time Voice Conversion for Augmenting Near-Field Speech
                  Communication},
  booktitle    = {Adjunct Proceedings of the 32nd Annual {ACM} Symposium on User Interface
                  Software and Technology, {UIST} 2019, New Orleans, LA, USA, October
                  20-23, 2019},
  pages        = {33--35},
  publisher    = {{ACM}},
  year         = {2019},
  url          = {https://doi.org/10.1145/3332167.3357106},
  doi          = {10.1145/3332167.3357106},
  timestamp    = {Fri, 04 Feb 2022 08:27:42 +0100},
  biburl       = {https://dblp.org/rec/conf/uist/ArakawaTS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/waspaa/NakanishiUKS19,
  author       = {Nakanishi, Masahiro and
                  Ueno, Natsuki and
                  Koyama, Shoichi and
                  Saruwatari, Hiroshi},
  title        = {Two-Dimensional Sound Field Recording With Multiple Circular Microphone Arrays Considering Multiple Scattering},
  booktitle    = {2019 {IEEE} Workshop on Applications of Signal Processing to Audio and Acoustics, {WASPAA} 2019, New Paltz, NY, USA, October 20-23, 2019},
  pages        = {368--372},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/WASPAA.2019.8937208},
  doi          = {10.1109/WASPAA.2019.8937208},
  timestamp    = {Fri, 27 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/waspaa/NakanishiUKS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1902-03389,
  author       = {Hiroki Tamaru and
                  Yuki Saito and
                  Shinnosuke Takamichi and
                  Tomoki Koriyama and
                  Hiroshi Saruwatari},
  title        = {Generative Moment Matching Network-based Random Modulation Post-filter
                  for {DNN}-based Singing Voice Synthesis and Neural Double-tracking},
  journal      = {CoRR},
  volume       = {abs/1902.03389},
  year         = {2019},
  url          = {https://arxiv.org/abs/1902.03389},
  eprinttype   = {arXiv},
  eprint       = {1902.03389},
  timestamp    = {Tue, 21 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-03389.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-02482,
  author       = {Yuki Kubo and
                  Norihiro Takamune and
                  Daichi Kitamura and
                  Hiroshi Saruwatari},
  title        = {Efficient Full-Rank Spatial Covariance Estimation Using Independent
                  Low-Rank Matrix Analysis for Blind Source Separation},
  journal      = {CoRR},
  volume       = {abs/1906.02482},
  year         = {2019},
  url          = {https://arxiv.org/abs/1906.02482},
  eprinttype   = {arXiv},
  eprint       = {1906.02482},
  timestamp    = {Thu, 13 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-02482.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1907-08294,
  author       = {Yuki Saito and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  title        = {{DNN}-based Speaker Embedding Using Subjective Inter-speaker Similarity
                  for Multi-speaker Modeling in Speech Synthesis},
  journal      = {CoRR},
  volume       = {abs/1907.08294},
  year         = {2019},
  url          = {https://arxiv.org/abs/1907.08294},
  eprinttype   = {arXiv},
  eprint       = {1907.08294},
  timestamp    = {Tue, 23 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-08294.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1908-01454,
  author       = {Taiki Nakamura and
                  Yuki Saito and
                  Shinnosuke Takamichi and
                  Yusuke Ijima and
                  Hiroshi Saruwatari},
  title        = {{V2S} attack: building {DNN}-based voice conversion from automatic speaker
                  verification},
  journal      = {CoRR},
  volume       = {abs/1908.01454},
  year         = {2019},
  url          = {http://arxiv.org/abs/1908.01454},
  eprinttype    = {arXiv},
  eprint       = {1908.01454},
  timestamp    = {Fri, 09 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1908-01454.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1908-01964,
  author       = {Yuki Kubo and
                  Norihiro Takamune and
                  Daichi Kitamura and
                  Hiroshi Saruwatari},
  title        = {Acceleration of rank-constrained spatial covariance matrix estimation
                  for blind speech extraction},
  journal      = {CoRR},
  volume       = {abs/1908.01964},
  year         = {2019},
  url          = {http://arxiv.org/abs/1908.01964},
  eprinttype    = {arXiv},
  eprint       = {1908.01964},
  timestamp    = {Fri, 09 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1908-01964.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1908-06248,
  author       = {Shinnosuke Takamichi and
                  Kentaro Mitsui and
                  Yuki Saito and
                  Tomoki Koriyama and
                  Naoko Tanji and
                  Hiroshi Saruwatari},
  title        = {{JVS} corpus: free {Japanese} multi-speaker voice corpus},
  journal      = {CoRR},
  volume       = {abs/1908.06248},
  year         = {2019},
  url          = {http://arxiv.org/abs/1908.06248},
  eprinttype    = {arXiv},
  eprint       = {1908.06248},
  timestamp    = {Mon, 26 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1908-06248.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-11391,
  author       = {Kazuki Fujii and
                  Yuki Saito and
                  Shinnosuke Takamichi and
                  Yukino Baba and
                  Hiroshi Saruwatari},
  title        = {{HumanGAN}: generative adversarial network with human-based discriminator
                  and its evaluation in speech perception modeling},
  journal      = {CoRR},
  volume       = {abs/1909.11391},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.11391},
  eprinttype    = {arXiv},
  eprint       = {1909.11391},
  timestamp    = {Fri, 27 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-11391.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ejasp/KitamuraMMTSOTK18,
  author       = {Daichi Kitamura and
                  Shinichi Mogami and
                  Yoshiki Mitsui and
                  Norihiro Takamune and
                  Hiroshi Saruwatari and
                  Nobutaka Ono and
                  Yu Takahashi and
                  Kazunobu Kondo},
  title        = {Generalized independent low-rank matrix analysis using heavy-tailed
                  distributions for blind source separation},
  journal      = {{EURASIP} J. Adv. Signal Process.},
  volume       = {2018},
  pages        = {28},
  year         = {2018},
  url          = {https://doi.org/10.1186/s13634-018-0549-5},
  doi          = {10.1186/S13634-018-0549-5},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ejasp/KitamuraMMTSOTK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/spl/UenoKS18,
  author       = {Natsuki Ueno and
                  Shoichi Koyama and
                  Hiroshi Saruwatari},
  title        = {Sound Field Recording Using Distributed Microphones Based on Harmonic
                  Analysis of Infinite Order},
  journal      = {{IEEE} Signal Process. Lett.},
  volume       = {25},
  number       = {1},
  pages        = {135--139},
  year         = {2018},
  url          = {https://doi.org/10.1109/LSP.2017.2775242},
  doi          = {10.1109/LSP.2017.2775242},
  timestamp    = {Wed, 04 Jul 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/spl/UenoKS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/SaitoTS18,
  author       = {Yuki Saito and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  title        = {Statistical Parametric Speech Synthesis Incorporating Generative Adversarial
                  Networks},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {26},
  number       = {1},
  pages        = {84--96},
  year         = {2018},
  url          = {https://doi.org/10.1109/TASLP.2017.2761547},
  doi          = {10.1109/TASLP.2017.2761547},
  timestamp    = {Tue, 29 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/SaitoTS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tsp/MurataKTS18,
  author       = {Naoki Murata and
                  Shoichi Koyama and
                  Norihiro Takamune and
                  Hiroshi Saruwatari},
  title        = {Sparse Representation Using Multidimensional Mixed-Norm Penalty With
                  Application to Sound Field Decomposition},
  journal      = {{IEEE} Trans. Signal Process.},
  volume       = {66},
  number       = {12},
  pages        = {3327--3338},
  year         = {2018},
  url          = {https://doi.org/10.1109/TSP.2018.2830318},
  doi          = {10.1109/TSP.2018.2830318},
  timestamp    = {Tue, 10 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tsp/MurataKTS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/UneSTKMS18,
  author       = {Masakazu Une and
                  Yuki Saito and
                  Shinnosuke Takamichi and
                  Daichi Kitamura and
                  Ryoichi Miyazaki and
                  Hiroshi Saruwatari},
  title        = {Generative approach using the noise generation models for {DNN}-based
                  speech synthesis trained from noisy speech},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA, November
                  12-15, 2018},
  pages        = {340--344},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.23919/APSIPA.2018.8659691},
  doi          = {10.23919/APSIPA.2018.8659691},
  timestamp    = {Tue, 29 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/UneSTKMS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/AkiyamaTS18,
  author       = {Takanori Akiyama and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  title        = {Prosody-aware subword embedding considering {Japanese} intonation systems
                  and its application to {DNN}-based multi-dialect speech synthesis},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA, November
                  12-15, 2018},
  pages        = {659--664},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.23919/APSIPA.2018.8659465},
  doi          = {10.23919/APSIPA.2018.8659465},
  timestamp    = {Sat, 09 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/AkiyamaTS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/MogamiTKSTKNO18,
  author       = {Shinichi Mogami and
                  Norihiro Takamune and
                  Daichi Kitamura and
                  Hiroshi Saruwatari and
                  Yu Takahashi and
                  Kazunobu Kondo and
                  Hiroaki Nakajima and
                  Nobutaka Ono},
  title        = {Independent Low-Rank Matrix Analysis Based on Time-Variant Sub-Gaussian
                  Source Model},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA, November
                  12-15, 2018},
  pages        = {1684--1691},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.23919/APSIPA.2018.8659577},
  doi          = {10.23919/APSIPA.2018.8659577},
  timestamp    = {Fri, 27 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/MogamiTKSTKNO18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/MogamiSKTTSO18,
  author       = {Shinichi Mogami and
                  Hayato Sumino and
                  Daichi Kitamura and
                  Norihiro Takamune and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari and
                  Nobutaka Ono},
  title        = {Independent Deeply Learned Matrix Analysis for Multichannel Audio
                  Source Separation},
  booktitle    = {26th European Signal Processing Conference, {EUSIPCO} 2018, Roma,
                  Italy, September 3-7, 2018},
  pages        = {1557--1561},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.23919/EUSIPCO.2018.8553246},
  doi          = {10.23919/EUSIPCO.2018.8553246},
  timestamp    = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/MogamiSKTTSO18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/TakidaKS18,
  author       = {Yuhta Takida and
                  Shoichi Koyama and
                  Hiroshi Saruwatari},
  title        = {Exterior and Interior Sound Field Separation Using Convex Optimization:
                  Comparison of Signal Models},
  booktitle    = {26th European Signal Processing Conference, {EUSIPCO} 2018, Roma,
                  Italy, September 3-7, 2018},
  pages        = {2549--2553},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.23919/EUSIPCO.2018.8552928},
  doi          = {10.23919/EUSIPCO.2018.8552928},
  timestamp    = {Fri, 27 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eusipco/TakidaKS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/UenoKS18,
  author       = {Natsuki Ueno and
                  Shoichi Koyama and
                  Hiroshi Saruwatari},
  title        = {Sound Field Reproduction with Exterior Cancellation Using Analytical
                  Weighting of Harmonic Coefficients},
  booktitle    = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages        = {466--470},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ICASSP.2018.8462084},
  doi          = {10.1109/ICASSP.2018.8462084},
  timestamp    = {Fri, 27 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/UenoKS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/MitsuiTKSTK18,
  author       = {Yoshiki Mitsui and
                  Norihiro Takamune and
                  Daichi Kitamura and
                  Hiroshi Saruwatari and
                  Yu Takahashi and
                  Kazunobu Kondo},
  title        = {Vectorwise Coordinate Descent Algorithm for Spatially Regularized
                  Independent Low-Rank Matrix Analysis},
  booktitle    = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages        = {746--750},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ICASSP.2018.8462657},
  doi          = {10.1109/ICASSP.2018.8462657},
  timestamp    = {Tue, 18 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/MitsuiTKSTK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaitoTS18,
  author       = {Yuki Saito and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  title        = {Text-to-Speech Synthesis Using {STFT} Spectra Based on Low-/Multi-Resolution
                  Generative Adversarial Networks},
  booktitle    = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages        = {5299--5303},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ICASSP.2018.8461714},
  doi          = {10.1109/ICASSP.2018.8461714},
  timestamp    = {Tue, 29 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/SaitoTS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ieeesam/TakidaKUS18,
  author       = {Yuhta Takida and
                  Shoichi Koyama and
                  Natsuki Ueno and
                  Hiroshi Saruwatari},
  title        = {Gridless Sound Field Decomposition Based on Reciprocity Gap Functional
                  in Spherical Harmonic Domain},
  booktitle    = {10th {IEEE} Sensor Array and Multichannel Signal Processing Workshop,
                  {SAM} 2018, Sheffield, South Yorkshire, United Kingdom, July 8-11,
                  2018},
  pages        = {627--631},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/SAM.2018.8448736},
  doi          = {10.1109/SAM.2018.8448736},
  timestamp    = {Fri, 27 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ieeesam/TakidaKUS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iwaenc/UenoKS18,
  author       = {Natsuki Ueno and
                  Shoichi Koyama and
                  Hiroshi Saruwatari},
  title        = {Kernel Ridge Regression with Constraint of {Helmholtz} Equation for
                  Sound Field Interpolation},
  booktitle    = {16th International Workshop on Acoustic Signal Enhancement, {IWAENC}
                  2018, Tokyo, Japan, September 17-20, 2018},
  pages        = {436--440},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/IWAENC.2018.8521334},
  doi          = {10.1109/IWAENC.2018.8521334},
  timestamp    = {Fri, 27 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iwaenc/UenoKS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iwaenc/TakamichiSTKS18,
  author       = {Shinnosuke Takamichi and
                  Yuki Saito and
                  Norihiro Takamune and
                  Daichi Kitamura and
                  Hiroshi Saruwatari},
  title        = {Phase Reconstruction from Amplitude Spectrograms Based on Von-{Mises}-Distribution
                  Deep Neural Network},
  booktitle    = {16th International Workshop on Acoustic Signal Enhancement, {IWAENC}
                  2018, Tokyo, Japan, September 17-20, 2018},
  pages        = {286--290},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/IWAENC.2018.8521313},
  doi          = {10.1109/IWAENC.2018.8521313},
  timestamp    = {Tue, 29 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iwaenc/TakamichiSTKS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lrec/TakamichiS18,
  author       = {Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  editor       = {Nicoletta Calzolari and
                  Khalid Choukri and
                  Christopher Cieri and
                  Thierry Declerck and
                  Sara Goggi and
                  K{\^{o}}iti Hasida and
                  Hitoshi Isahara and
                  Bente Maegaard and
                  Joseph Mariani and
                  H{\'{e}}l{\`{e}}ne Mazo and
                  Asunci{\'{o}}n Moreno and
                  Jan Odijk and
                  Stelios Piperidis and
                  Takenobu Tokunaga},
  title        = {{CPJD} Corpus: Crowdsourced Parallel Speech Corpus of {Japanese} Dialects},
  booktitle    = {Proceedings of the Eleventh International Conference on Language Resources
                  and Evaluation, {LREC} 2018, Miyazaki, Japan, May 7-12, 2018},
  publisher    = {European Language Resources Association {(ELRA)}},
  year         = {2018},
  url          = {http://www.lrec-conf.org/proceedings/lrec2018/summaries/67.html},
  timestamp    = {Mon, 19 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/lrec/TakamichiS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-10307,
  author       = {Shinichi Mogami and
                  Hayato Sumino and
                  Daichi Kitamura and
                  Norihiro Takamune and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari and
                  Nobutaka Ono},
  title        = {Independent Deeply Learned Matrix Analysis for Multichannel Audio
                  Source Separation},
  journal      = {CoRR},
  volume       = {abs/1806.10307},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.10307},
  eprinttype    = {arXiv},
  eprint       = {1806.10307},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-10307.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1807-03474,
  author       = {Shinnosuke Takamichi and
                  Yuki Saito and
                  Norihiro Takamune and
                  Daichi Kitamura and
                  Hiroshi Saruwatari},
  title        = {Phase reconstruction from amplitude spectrograms based on von-{Mises}-distribution
                  deep neural network},
  journal      = {CoRR},
  volume       = {abs/1807.03474},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.03474},
  eprinttype    = {arXiv},
  eprint       = {1807.03474},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-03474.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/SaitoTS17,
  author       = {Yuki Saito and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  title        = {Voice Conversion Using Input-to-Output Highway Networks},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {100-D},
  number       = {8},
  pages        = {1925--1928},
  year         = {2017},
  url          = {https://doi.org/10.1587/transinf.2017EDL8034},
  doi          = {10.1587/TRANSINF.2017EDL8034},
  timestamp    = {Tue, 29 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ieicet/SaitoTS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jrm/BandoSOMIKITMYM17,
  author       = {Yoshiaki Bando and
                  Hiroshi Saruwatari and
                  Nobutaka Ono and
                  Shoji Makino and
                  Katsutoshi Itoyama and
                  Daichi Kitamura and
                  Masaru Ishimura and
                  Moe Takakusaki and
                  Narumi Mae and
                  Kouei Yamaoka and
                  Yutaro Matsui and
                  Yuichi Ambe and
                  Masashi Konyo and
                  Satoshi Tadokoro and
                  Kazuyoshi Yoshii and
                  Hiroshi G. Okuno},
  title        = {Low Latency and High Quality Two-Stage Human-Voice-Enhancement System
                  for a Hose-Shaped Rescue Robot},
  journal      = {J. Robotics Mechatronics},
  volume       = {29},
  number       = {1},
  pages        = {198--212},
  year         = {2017},
  url          = {https://doi.org/10.20965/jrm.2017.p0198},
  doi          = {10.20965/JRM.2017.P0198},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jrm/BandoSOMIKITMYM17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/MaeMMKOYS17,
  author       = {Narumi Mae and
                  Yoshiki Mitsui and
                  Shoji Makino and
                  Daichi Kitamura and
                  Nobutaka Ono and
                  Takeshi Yamada and
                  Hiroshi Saruwatari},
  title        = {Sound source localization using binaural difference for hose-shaped
                  rescue robot},
  booktitle    = {2017 Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} {ASC} 2017, Kuala Lumpur, Malaysia,
                  December 12-15, 2017},
  pages        = {1621--1627},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/APSIPA.2017.8282292},
  doi          = {10.1109/APSIPA.2017.8282292},
  timestamp    = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/apsipa/MaeMMKOYS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/camsap/MitsuiKTSTK17,
  author       = {Yoshiki Mitsui and
                  Daichi Kitamura and
                  Norihiro Takamune and
                  Hiroshi Saruwatari and
                  Yu Takahashi and
                  Kazunobu Kondo},
  title        = {Independent low-rank matrix analysis based on parametric majorization-equalization
                  algorithm},
  booktitle    = {2017 {IEEE} 7th International Workshop on Computational Advances in
                  Multi-Sensor Adaptive Processing, {CAMSAP} 2017, Cura{\c{c}}ao, The
                  Netherlands, December 10-13, 2017},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/CAMSAP.2017.8313107},
  doi          = {10.1109/CAMSAP.2017.8313107},
  timestamp    = {Wed, 16 Oct 2019 14:14:56 +0200},
  biburl       = {https://dblp.org/rec/conf/camsap/MitsuiKTSTK17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/KitamuraOS17,
  author       = {Daichi Kitamura and
                  Nobutaka Ono and
                  Hiroshi Saruwatari},
  title        = {Experimental analysis of optimal window length for independent low-rank
                  matrix analysis},
  booktitle    = {25th European Signal Processing Conference, {EUSIPCO} 2017, Kos, Greece,
                  August 28 - September 2, 2017},
  pages        = {1170--1174},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.23919/EUSIPCO.2017.8081392},
  doi          = {10.23919/EUSIPCO.2017.8081392},
  timestamp    = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/KitamuraOS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/hscma/UenoKS17,
  author       = {Natsuki Ueno and
                  Shoichi Koyama and
                  Hiroshi Saruwatari},
  title        = {Listening-area-informed sound field reproduction with {Gaussian} prior
                  based on circular harmonic expansion},
  booktitle    = {Hands-free Speech Communications and Microphone Arrays, {HSCMA} 2017,
                  San Francisco, CA, USA, March 1-3, 2017},
  pages        = {196--200},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/HSCMA.2017.7895589},
  doi          = {10.1109/HSCMA.2017.7895589},
  timestamp    = {Wed, 16 Oct 2019 14:14:57 +0200},
  biburl       = {https://dblp.org/rec/conf/hscma/UenoKS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ica/MaeIMKOYS17,
  author       = {Narumi Mae and
                  Masaru Ishimura and
                  Shoji Makino and
                  Daichi Kitamura and
                  Nobutaka Ono and
                  Takeshi Yamada and
                  Hiroshi Saruwatari},
  editor       = {Petr Tichavsk{\'{y}} and
                  Massoud Babaie{-}Zadeh and
                  Olivier J. J. Michel and
                  Nad{\`{e}}ge Thirion{-}Moreau},
  title        = {Ego Noise Reduction for Hose-Shaped Rescue Robot Combining Independent
                  Low-Rank Matrix Analysis and Multichannel Noise Cancellation},
  booktitle    = {Latent Variable Analysis and Signal Separation - 13th International
                  Conference, {LVA/ICA} 2017, Grenoble, France, February 21-23, 2017,
                  Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {10169},
  pages        = {141--151},
  year         = {2017},
  url          = {https://doi.org/10.1007/978-3-319-53547-0\_14},
  doi          = {10.1007/978-3-319-53547-0\_14},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ica/MaeIMKOYS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/MitsuiKTOS17,
  author       = {Yoshiki Mitsui and
                  Daichi Kitamura and
                  Shinnosuke Takamichi and
                  Nobutaka Ono and
                  Hiroshi Saruwatari},
  title        = {Blind source separation based on independent low-rank matrix analysis
                  with sparse regularization for time-series activity},
  booktitle    = {2017 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2017, New Orleans, LA, USA, March 5-9, 2017},
  pages        = {21--25},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/ICASSP.2017.7951790},
  doi          = {10.1109/ICASSP.2017.7951790},
  timestamp    = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/MitsuiKTOS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/UenoKS17,
  author       = {Natsuki Ueno and
                  Shoichi Koyama and
                  Hiroshi Saruwatari},
  title        = {Listening-area-informed sound field reproduction based on circular
                  harmonic expansion},
  booktitle    = {2017 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2017, New Orleans, LA, USA, March 5-9, 2017},
  pages        = {111--115},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/ICASSP.2017.7952128},
  doi          = {10.1109/ICASSP.2017.7952128},
  timestamp    = {Sat, 16 Sep 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/UenoKS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/MurataKTS17,
  author       = {Naoki Murata and
                  Shoichi Koyama and
                  Norihiro Takamune and
                  Hiroshi Saruwatari},
  title        = {Spatio-temporal sparse sound field decomposition considering acoustic
                  source signal characteristics},
  booktitle    = {2017 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2017, New Orleans, LA, USA, March 5-9, 2017},
  pages        = {441--445},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/ICASSP.2017.7952194},
  doi          = {10.1109/ICASSP.2017.7952194},
  timestamp    = {Sat, 16 Sep 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/MurataKTS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaitoTS17,
  author       = {Yuki Saito and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  title        = {Training algorithm to deceive Anti-Spoofing Verification for {DNN}-based
                  speech synthesis},
  booktitle    = {2017 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2017, New Orleans, LA, USA, March 5-9, 2017},
  pages        = {4900--4904},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/ICASSP.2017.7953088},
  doi          = {10.1109/ICASSP.2017.7953088},
  timestamp    = {Tue, 29 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/SaitoTS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/MiyoshiSTS17,
  author       = {Hiroyuki Miyoshi and
                  Yuki Saito and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  editor       = {Francisco Lacerda},
  title        = {Voice Conversion Using Sequence-to-Sequence Learning of Context Posterior
                  Probabilities},
  booktitle    = {Interspeech 2017, 18th Annual Conference of the International Speech
                  Communication Association, Stockholm, Sweden, August 20-24, 2017},
  pages        = {1268--1272},
  publisher    = {{ISCA}},
  year         = {2017},
  url          = {https://doi.org/10.21437/Interspeech.2017-247},
  doi          = {10.21437/INTERSPEECH.2017-247},
  timestamp    = {Sun, 06 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/MiyoshiSTS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/TakamichiKS17,
  author       = {Shinnosuke Takamichi and
                  Tomoki Koriyama and
                  Hiroshi Saruwatari},
  editor       = {Francisco Lacerda},
  title        = {Sampling-Based Speech Parameter Generation Using Moment-Matching Networks},
  booktitle    = {Interspeech 2017, 18th Annual Conference of the International Speech
                  Communication Association, Stockholm, Sweden, August 20-24, 2017},
  pages        = {3961--3965},
  publisher    = {{ISCA}},
  year         = {2017},
  url          = {https://doi.org/10.21437/Interspeech.2017-362},
  doi          = {10.21437/INTERSPEECH.2017-362},
  timestamp    = {Sun, 06 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/TakamichiKS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mlsp/MogamiKMTSO17,
  author       = {Shinichi Mogami and
                  Daichi Kitamura and
                  Yoshiki Mitsui and
                  Norihiro Takamune and
                  Hiroshi Saruwatari and
                  Nobutaka Ono},
  editor       = {Naonori Ueda and
                  Shinji Watanabe and
                  Tomoko Matsui and
                  Jen{-}Tzung Chien and
                  Jan Larsen},
  title        = {Independent low-rank matrix analysis based on complex {Student's} t-distribution
                  for blind audio source separation},
  booktitle    = {27th {IEEE} International Workshop on Machine Learning for Signal
                  Processing, {MLSP} 2017, Tokyo, Japan, September 25-28, 2017},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/MLSP.2017.8168129},
  doi          = {10.1109/MLSP.2017.8168129},
  timestamp    = {Tue, 30 Jun 2020 10:25:30 +0200},
  biburl       = {https://dblp.org/rec/conf/mlsp/MogamiKMTSO17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MiyoshiSTS17,
  author     = {Miyoshi, Hiroyuki
                and Saito, Yuki
                and Takamichi, Shinnosuke
                and Saruwatari, Hiroshi},
  title      = {Voice Conversion Using Sequence-to-Sequence Learning of Context Posterior Probabilities},
  journal    = {CoRR},
  volume     = {abs/1704.02360},
  year       = {2017},
  url        = {http://arxiv.org/abs/1704.02360},
  eprinttype = {arXiv},
  eprint     = {1704.02360},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/MiyoshiSTS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/TakamichiKS17,
  author     = {Takamichi, Shinnosuke
                and Koriyama, Tomoki
                and Saruwatari, Hiroshi},
  title      = {Sampling-based speech parameter generation using moment-matching networks},
  journal    = {CoRR},
  volume     = {abs/1704.03626},
  year       = {2017},
  url        = {http://arxiv.org/abs/1704.03626},
  eprinttype = {arXiv},
  eprint     = {1704.03626},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/TakamichiKS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Local deviation from the DBLP export: the proper noun Student's in the title
% is brace-protected so sentence-casing styles cannot lowercase it.
@article{DBLP:journals/corr/abs-1708-04795,
  author       = {Shinichi Mogami and
                  Daichi Kitamura and
                  Yoshiki Mitsui and
                  Norihiro Takamune and
                  Hiroshi Saruwatari and
                  Nobutaka Ono},
  title        = {Independent Low-Rank Matrix Analysis Based on Complex {Student's} t-Distribution
                  for Blind Audio Source Separation},
  journal      = {CoRR},
  volume       = {abs/1708.04795},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.04795},
  eprinttype   = {arXiv},
  eprint       = {1708.04795},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-04795.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1709-08041,
  author     = {Saito, Yuki
                and Takamichi, Shinnosuke
                and Saruwatari, Hiroshi},
  title      = {Statistical Parametric Speech Synthesis Incorporating Generative Adversarial Networks},
  journal    = {CoRR},
  volume     = {abs/1709.08041},
  year       = {2017},
  url        = {http://arxiv.org/abs/1709.08041},
  eprinttype = {arXiv},
  eprint     = {1709.08041},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1709-08041.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1710-01589,
  author     = {Mitsui, Yoshiki
                and Kitamura, Daichi
                and Takamune, Norihiro
                and Saruwatari, Hiroshi
                and Takahashi, Yu
                and Kondo, Kazunobu},
  title      = {Independent Low-Rank Matrix Analysis Based on Parametric Majorization-Equalization Algorithm},
  journal    = {CoRR},
  volume     = {abs/1710.01589},
  year       = {2017},
  url        = {http://arxiv.org/abs/1710.01589},
  eprinttype = {arXiv},
  eprint     = {1710.01589},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1710-01589.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Local deviation from the DBLP export: the proper adjective Japanese in the
% title is brace-protected so sentence-casing styles cannot lowercase it.
@article{DBLP:journals/corr/abs-1711-00354,
  author       = {Ryosuke Sonobe and
                  Shinnosuke Takamichi and
                  Hiroshi Saruwatari},
  title        = {{JSUT} corpus: free large-scale {Japanese} speech corpus for end-to-end
                  speech synthesis},
  journal      = {CoRR},
  volume       = {abs/1711.00354},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.00354},
  eprinttype   = {arXiv},
  eprint       = {1711.00354},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-00354.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/KitamuraOSKS16,
  author     = {Kitamura, Daichi
                and Ono, Nobutaka
                and Sawada, Hiroshi
                and Kameoka, Hirokazu
                and Saruwatari, Hiroshi},
  title      = {Determined Blind Source Separation Unifying Independent Vector Analysis and Nonnegative Matrix Factorization},
  journal    = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume     = {24},
  number     = {9},
  pages      = {1626--1641},
  year       = {2016},
  url        = {https://doi.org/10.1109/TASLP.2016.2577880},
  doi        = {10.1109/TASLP.2016.2577880},
  timestamp  = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/taslp/KitamuraOSKS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/apsipa/NakajimaKTKSTK16,
  author     = {Nakajima, Hiroaki
                and Kitamura, Daichi
                and Takamune, Norihiro
                and Koyama, Shoichi
                and Saruwatari, Hiroshi
                and Takahashi, Yu
                and Kondo, Kazunobu},
  title      = {Audio signal separation using supervised {NMF} with time-variant all-pole-model-based basis deformation},
  booktitle  = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} 2016, Jeju, South Korea, December 13-16, 2016},
  pages      = {1--7},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/APSIPA.2016.7820763},
  doi        = {10.1109/APSIPA.2016.7820763},
  timestamp  = {Wed, 16 Oct 2019 14:14:55 +0200},
  biburl     = {https://dblp.org/rec/conf/apsipa/NakajimaKTKSTK16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/eusipco/NakajimaKTKSOTK16,
  author     = {Nakajima, Hiroaki
                and Kitamura, Daichi
                and Takamune, Norihiro
                and Koyama, Shoichi
                and Saruwatari, Hiroshi
                and Ono, Nobutaka
                and Takahashi, Yu
                and Kondo, Kazunobu},
  title      = {Music signal separation using supervised {NMF} with all-pole-model-based discriminative basis deformation},
  booktitle  = {24th European Signal Processing Conference, {EUSIPCO} 2016, Budapest, Hungary, August 29 - September 2, 2016},
  pages      = {1143--1147},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/EUSIPCO.2016.7760427},
  doi        = {10.1109/EUSIPCO.2016.7760427},
  timestamp  = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/eusipco/NakajimaKTKSOTK16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/eusipco/MurataKKANKS16,
  author     = {Murata, Naoki
                and Kameoka, Hirokazu
                and Kinoshita, Keisuke
                and Araki, Shoko
                and Nakatani, Tomohiro
                and Koyama, Shoichi
                and Saruwatari, Hiroshi},
  title      = {Reverberation-robust underdetermined source separation with non-negative tensor double deconvolution},
  booktitle  = {24th European Signal Processing Conference, {EUSIPCO} 2016, Budapest, Hungary, August 29 - September 2, 2016},
  pages      = {1648--1652},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/EUSIPCO.2016.7760528},
  doi        = {10.1109/EUSIPCO.2016.7760528},
  timestamp  = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/eusipco/MurataKKANKS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/MitsufujiKS16,
  author     = {Mitsufuji, Yuki
                and Koyama, Shoichi
                and Saruwatari, Hiroshi},
  title      = {Multichannel blind source separation based on non-negative tensor factorization in wavenumber domain},
  booktitle  = {2016 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2016, Shanghai, China, March 20-25, 2016},
  pages      = {56--60},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/ICASSP.2016.7471636},
  doi        = {10.1109/ICASSP.2016.7471636},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/MitsufujiKS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/MurataKKTS16,
  author     = {Murata, Naoki
                and Koyama, Shoichi
                and Kameoka, Hirokazu
                and Takamune, Norihiro
                and Saruwatari, Hiroshi},
  title      = {Sparse sound field decomposition with multichannel extension of complex {NMF}},
  booktitle  = {2016 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2016, Shanghai, China, March 20-25, 2016},
  pages      = {345--349},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/ICASSP.2016.7471694},
  doi        = {10.1109/ICASSP.2016.7471694},
  timestamp  = {Sat, 16 Sep 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/MurataKKTS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/KoyamaS16,
  author     = {Koyama, Shoichi
                and Saruwatari, Hiroshi},
  title      = {Sound field decomposition in reverberant environment using sparse and low-rank signal models},
  booktitle  = {2016 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2016, Shanghai, China, March 20-25, 2016},
  pages      = {395--399},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/ICASSP.2016.7471704},
  doi        = {10.1109/ICASSP.2016.7471704},
  timestamp  = {Sat, 16 Sep 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/KoyamaS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/LiKHS16,
  author     = {Li, Li
                and Kameoka, Hirokazu
                and Higuchi, Takuya
                and Saruwatari, Hiroshi},
  editor     = {Morgan, Nelson},
  title      = {Semi-Supervised Joint Enhancement of Spectral and Cepstral Sequences of Noisy Speech},
  booktitle  = {Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016},
  pages      = {3753--3757},
  publisher  = {{ISCA}},
  year       = {2016},
  url        = {https://doi.org/10.21437/Interspeech.2016-1286},
  doi        = {10.21437/INTERSPEECH.2016-1286},
  timestamp  = {Mon, 26 Jun 2023 16:43:56 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/LiKHS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iwaenc/IshimuraMYOS16,
  author     = {Ishimura, Masaru
                and Makino, Shoji
                and Yamada, Takeshi
                and Ono, Nobutaka
                and Saruwatari, Hiroshi},
  title      = {Noise reduction using independent vector analysis and noise cancellation for a hose-shaped rescue robot},
  booktitle  = {{IEEE} International Workshop on Acoustic Signal Enhancement, {IWAENC} 2016, Xi'an, China, September 13-16, 2016},
  pages      = {1--5},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/IWAENC.2016.7602912},
  doi        = {10.1109/IWAENC.2016.7602912},
  timestamp  = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iwaenc/IshimuraMYOS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iwaenc/KitamuraOSTK16,
  author     = {Kitamura, Daichi
                and Ono, Nobutaka
                and Saruwatari, Hiroshi
                and Takahashi, Yu
                and Kondo, Kazunobu},
  title      = {Discriminative and reconstructive basis training for audio source separation with semi-supervised nonnegative matrix factorization},
  booktitle  = {{IEEE} International Workshop on Acoustic Signal Enhancement, {IWAENC} 2016, Xi'an, China, September 13-16, 2016},
  pages      = {1--5},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/IWAENC.2016.7602901},
  doi        = {10.1109/IWAENC.2016.7602901},
  timestamp  = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iwaenc/KitamuraOSTK16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iwaenc/TakakusakiKOYMS16,
  author     = {Takakusaki, Moe
                and Kitamura, Daichi
                and Ono, Nobutaka
                and Yamada, Takeshi
                and Makino, Shoji
                and Saruwatari, Hiroshi},
  title      = {Ego-noise reduction for a hose-shaped rescue robot using determined rank-1 multichannel nonnegative matrix factorization},
  booktitle  = {{IEEE} International Workshop on Acoustic Signal Enhancement, {IWAENC} 2016, Xi'an, China, September 13-16, 2016},
  pages      = {1--4},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/IWAENC.2016.7602914},
  doi        = {10.1109/IWAENC.2016.7602914},
  timestamp  = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iwaenc/TakakusakiKOYMS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/taslp/KitamuraSKTKN15,
  author     = {Kitamura, Daichi
                and Saruwatari, Hiroshi
                and Kameoka, Hirokazu
                and Takahashi, Yu
                and Kondo, Kazunobu
                and Nakamura, Satoshi},
  title      = {Multichannel Signal Separation Combining Directional Clustering and Nonnegative Matrix Factorization with Spectrogram Restoration},
  journal    = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume     = {23},
  number     = {4},
  pages      = {654--669},
  year       = {2015},
  url        = {https://doi.org/10.1109/TASLP.2015.2401425},
  doi        = {10.1109/TASLP.2015.2401425},
  timestamp  = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/taslp/KitamuraSKTKN15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Local deviation from the DBLP export: the proper adjective Bayesian in the
% title is brace-protected so sentence-casing styles cannot lowercase it.
@inproceedings{DBLP:conf/apsipa/KoyamaMMS15,
  author       = {Shoichi Koyama and
                  Atsushi Matsubayashi and
                  Naoki Murata and
                  Hiroshi Saruwatari},
  title        = {Sparse sound field decomposition using group sparse {Bayesian} learning},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} 2015, Hong Kong, December 16-19, 2015},
  pages        = {850--855},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/APSIPA.2015.7415391},
  doi          = {10.1109/APSIPA.2015.7415391},
  timestamp    = {Wed, 16 Oct 2019 14:14:55 +0200},
  biburl       = {https://dblp.org/rec/conf/apsipa/KoyamaMMS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/camsap/MurataKTS15,
  author     = {Murata, Naoki
                and Koyama, Shoichi
                and Takamune, Norihiro
                and Saruwatari, Hiroshi},
  title      = {Sparse sound field decomposition with parametric dictionary learning for super-resolution recording and reproduction},
  booktitle  = {6th {IEEE} International Workshop on Computational Advances in Multi-Sensor Adaptive Processing, {CAMSAP} 2015, Cancun, Mexico, December 13-16, 2015},
  pages      = {69--72},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/CAMSAP.2015.7383738},
  doi        = {10.1109/CAMSAP.2015.7383738},
  timestamp  = {Wed, 16 Oct 2019 14:14:56 +0200},
  biburl     = {https://dblp.org/rec/conf/camsap/MurataKTS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/eusipco/KitamuraOSKS15,
  author     = {Kitamura, Daichi
                and Ono, Nobutaka
                and Sawada, Hiroshi
                and Kameoka, Hirokazu
                and Saruwatari, Hiroshi},
  title      = {Relaxation of rank-1 spatial constraint in overdetermined blind source separation},
  booktitle  = {23rd European Signal Processing Conference, {EUSIPCO} 2015, Nice, France, August 31 - September 4, 2015},
  pages      = {1261--1265},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/EUSIPCO.2015.7362586},
  doi        = {10.1109/EUSIPCO.2015.7362586},
  timestamp  = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/eusipco/KitamuraOSKS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/KitamuraOSKS15,
  author     = {Kitamura, Daichi
                and Ono, Nobutaka
                and Sawada, Hiroshi
                and Kameoka, Hirokazu
                and Saruwatari, Hiroshi},
  title      = {Efficient multichannel nonnegative matrix factorization exploiting rank-1 spatial model},
  booktitle  = {2015 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2015, South Brisbane, Queensland, Australia, April 19-24, 2015},
  pages      = {276--280},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/ICASSP.2015.7177975},
  doi        = {10.1109/ICASSP.2015.7177975},
  timestamp  = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/KitamuraOSKS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/MurotaKKSN15,
  author     = {Murota, Yuki
                and Kitamura, Daichi
                and Koyama, Shoichi
                and Saruwatari, Hiroshi
                and Nakamura, Satoshi},
  title      = {Statistical modeling of binaural signal and its application to binaural source separation},
  booktitle  = {2015 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2015, South Brisbane, Queensland, Australia, April 19-24, 2015},
  pages      = {494--498},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/ICASSP.2015.7178018},
  doi        = {10.1109/ICASSP.2015.7178018},
  timestamp  = {Sat, 16 Sep 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/MurotaKKSN15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/KoyamaMS15,
  author     = {Koyama, Shoichi
                and Murata, Naoki
                and Saruwatari, Hiroshi},
  title      = {Structured sparse signal models and decomposition algorithm for super-resolution in sound field recording and reproduction},
  booktitle  = {2015 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2015, South Brisbane, Queensland, Australia, April 19-24, 2015},
  pages      = {619--623},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/ICASSP.2015.7178043},
  doi        = {10.1109/ICASSP.2015.7178043},
  timestamp  = {Sat, 16 Sep 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/KoyamaMS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icdsp/Saruwatari15,
  author     = {Saruwatari, Hiroshi},
  title      = {Statistical-model-based speech enhancement with musical-noise-free properties},
  booktitle  = {2015 {IEEE} International Conference on Digital Signal Processing, {DSP} 2015, Singapore, July 21-24, 2015},
  pages      = {1201--1205},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/ICDSP.2015.7252070},
  doi        = {10.1109/ICDSP.2015.7252070},
  timestamp  = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl     = {https://dblp.org/rec/conf/icdsp/Saruwatari15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/waspaa/KoyamaIS15,
  author     = {Koyama, Shoichi
                and Ito, Koichiro
                and Saruwatari, Hiroshi},
  title      = {Source-location-informed sound field recording and reproduction with spherical arrays},
  booktitle  = {2015 {IEEE} Workshop on Applications of Signal Processing to Audio and Acoustics, {WASPAA} 2015, New Paltz, NY, USA, October 18-21, 2015},
  pages      = {1--5},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/WASPAA.2015.7336914},
  doi        = {10.1109/WASPAA.2015.7336914},
  timestamp  = {Wed, 16 Oct 2019 14:14:57 +0200},
  biburl     = {https://dblp.org/rec/conf/waspaa/KoyamaIS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ieicet/KitamuraSYSTK14,
  author     = {Kitamura, Daichi
                and Saruwatari, Hiroshi
                and Yagi, Kosuke
                and Shikano, Kiyohiro
                and Takahashi, Yu
                and Kondo, Kazunobu},
  title      = {Music Signal Separation Based on Supervised Nonnegative Matrix Factorization with Orthogonality and Maximum-Divergence Penalties},
  journal    = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume     = {97-A},
  number     = {5},
  pages      = {1113--1118},
  year       = {2014},
  url        = {https://doi.org/10.1587/transfun.E97.A.1113},
  doi        = {10.1587/TRANSFUN.E97.A.1113},
  timestamp  = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ieicet/KitamuraSYSTK14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/sigpro/MiyazakiSNSKBB14,
  author     = {Miyazaki, Ryoichi
                and Saruwatari, Hiroshi
                and Nakamura, Satoshi
                and Shikano, Kiyohiro
                and Kondo, Kazunobu
                and Blanchette, Jonathan
                and Bouchard, Martin},
  title      = {Musical-noise-free blind speech extraction integrating microphone array and iterative spectral subtraction},
  journal    = {Signal Process.},
  volume     = {102},
  pages      = {226--239},
  year       = {2014},
  url        = {https://doi.org/10.1016/j.sigpro.2014.03.010},
  doi        = {10.1016/J.SIGPRO.2014.03.010},
  timestamp  = {Sat, 22 Feb 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/sigpro/MiyazakiSNSKBB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/taslp/DoiTNSS14,
  author     = {Doi, Hironori
                and Toda, Tomoki
                and Nakamura, Keigo
                and Saruwatari, Hiroshi
                and Shikano, Kiyohiro},
  title      = {Alaryngeal Speech Enhancement Based on One-to-Many Eigenvoice Conversion},
  journal    = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume     = {22},
  number     = {1},
  pages      = {172--183},
  year       = {2014},
  url        = {https://doi.org/10.1109/TASLP.2013.2286917},
  doi        = {10.1109/TASLP.2013.2286917},
  timestamp  = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/taslp/DoiTNSS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/apsipa/KitamuraSNTKK14,
  author     = {Kitamura, Daichi
                and Saruwatari, Hiroshi
                and Nakamura, Satoshi
                and Takahashi, Yu
                and Kondo, Kazunobu
                and Kameoka, Hirokazu},
  title      = {Hybrid multichannel signal separation using supervised nonnegative matrix factorization with spectrogram restoration},
  booktitle  = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} 2014, Chiang Mai, Thailand, December 9-12, 2014},
  pages      = {1--10},
  publisher  = {{IEEE}},
  year       = {2014},
  url        = {https://doi.org/10.1109/APSIPA.2014.7041664},
  doi        = {10.1109/APSIPA.2014.7041664},
  timestamp  = {Wed, 16 Oct 2019 14:14:55 +0200},
  biburl     = {https://dblp.org/rec/conf/apsipa/KitamuraSNTKK14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hscma/KitamuraSNTKK14,
  author     = {Kitamura, Daichi
                and Saruwatari, Hiroshi
                and Nakamura, Satoshi
                and Takahashi, Yu
                and Kondo, Kazunobu
                and Kameoka, Hirokazu},
  title      = {Divergence optimization in nonnegative matrix factorization with spectrogram restoration for multichannel signal separation},
  booktitle  = {4th Joint Workshop on Hands-free Speech Communication and Microphone Arrays, {HSCMA} 2014, Villers-les-Nancy, France, May 12-14, 2014},
  pages      = {92--96},
  publisher  = {{IEEE}},
  year       = {2014},
  url        = {https://doi.org/10.1109/HSCMA.2014.6843258},
  doi        = {10.1109/HSCMA.2014.6843258},
  timestamp  = {Wed, 16 Oct 2019 14:14:57 +0200},
  biburl     = {https://dblp.org/rec/conf/hscma/KitamuraSNTKK14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hscma/NakaiSMNK14,
  author     = {Nakai, Shunsuke
                and Saruwatari, Hiroshi
                and Miyazaki, Ryoichi
                and Nakamura, Satoshi
                and Kondo, Kazunobu},
  title      = {Theoretical analysis of biased {MMSE} short-time spectral amplitude estimator and its extension to musical-noise-free speech enhancement},
  booktitle  = {4th Joint Workshop on Hands-free Speech Communication and Microphone Arrays, {HSCMA} 2014, Villers-les-Nancy, France, May 12-14, 2014},
  pages      = {122--126},
  publisher  = {{IEEE}},
  year       = {2014},
  url        = {https://doi.org/10.1109/HSCMA.2014.6843264},
  doi        = {10.1109/HSCMA.2014.6843264},
  timestamp  = {Thu, 24 Aug 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/hscma/NakaiSMNK14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hscma/AprilyantiSNT14,
  author     = {Aprilyanti, Fine Dwinita
                and Saruwatari, Hiroshi
                and Nakamura, Satoshi
                and Takatani, Tomoya},
  title      = {Optimized joint noise suppression and dereverberation based on blind signal extraction for hands-free speech recognition system},
  booktitle  = {4th Joint Workshop on Hands-free Speech Communication and Microphone Arrays, {HSCMA} 2014, Villers-les-Nancy, France, May 12-14, 2014},
  pages      = {182--186},
  publisher  = {{IEEE}},
  year       = {2014},
  url        = {https://doi.org/10.1109/HSCMA.2014.6843276},
  doi        = {10.1109/HSCMA.2014.6843276},
  timestamp  = {Thu, 24 Aug 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/hscma/AprilyantiSNT14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Local deviation from the DBLP export: the proper adjective Bayesian in the
% title is brace-protected so sentence-casing styles cannot lowercase it.
@inproceedings{DBLP:conf/icassp/MurotaKNSNTK14,
  author       = {Yuki Murota and
                  Daichi Kitamura and
                  Shunsuke Nakai and
                  Hiroshi Saruwatari and
                  Satoshi Nakamura and
                  Yu Takahashi and
                  Kazunobu Kondo},
  title        = {Music signal separation based on {Bayesian} spectral amplitude estimator
                  with automatic target prior adaptation},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages        = {7490--7494},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/ICASSP.2014.6855056},
  doi          = {10.1109/ICASSP.2014.6855056},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/MurotaKNSNTK14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/sigpro/MustiereBNPTS13,
  author     = {Musti{\`{e}}re, Fr{\'{e}}d{\'{e}}ric
                and Bouchard, Martin
                and Najaf{-}Zadeh, Hossein
                and Pichevar, Ramin
                and Thibault, Louis
                and Saruwatari, Hiroshi},
  title      = {Design of multichannel frequency domain statistical-based enhancement systems preserving spatial cues via spectral distances minimization},
  journal    = {Signal Process.},
  volume     = {93},
  number     = {1},
  pages      = {321--325},
  year       = {2013},
  url        = {https://doi.org/10.1016/j.sigpro.2012.06.024},
  doi        = {10.1016/J.SIGPRO.2012.06.024},
  timestamp  = {Sat, 22 Feb 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/sigpro/MustiereBNPTS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/apsipa/AprilyantiSSNT13,
  author     = {Aprilyanti, Fine Dwinita
                and Saruwatari, Hiroshi
                and Shikano, Kiyohiro
                and Nakamura, Satoshi
                and Takatani, Tomoya},
  title      = {Semi-blind algorithm for joint noise suppression and dereverberation based on higher-order statistics and acoustic model likelihood},
  booktitle  = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} 2013, Kaohsiung, Taiwan, October 29 - November 1, 2013},
  pages      = {1--6},
  publisher  = {{IEEE}},
  year       = {2013},
  url        = {https://doi.org/10.1109/APSIPA.2013.6694161},
  doi        = {10.1109/APSIPA.2013.6694161},
  timestamp  = {Wed, 16 Oct 2019 14:14:55 +0200},
  biburl     = {https://dblp.org/rec/conf/apsipa/AprilyantiSSNT13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/apsipa/MiyazakiSNSKBB13,
  author       = {Ryoichi Miyazaki and
                  Hiroshi Saruwatari and
                  Satoshi Nakamura and
                  Kiyohiro Shikano and
                  Kazunobu Kondo and
                  Jonathan Blanchette and
                  Martin Bouchard},
  title        = {Toward musical-noise-free blind speech extraction: Concept and its
                  applications},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} 2013, Kaohsiung, Taiwan, October 29
                  - November 1, 2013},
  pages        = {1--10},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/APSIPA.2013.6694291},
  doi          = {10.1109/APSIPA.2013.6694291},
  timestamp    = {Thu, 26 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/apsipa/MiyazakiSNSKBB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icdsp/KitamuraSISKT13,
  author       = {Daichi Kitamura and
                  Hiroshi Saruwatari and
                  Yusuke Iwao and
                  Kiyohiro Shikano and
                  Kazunobu Kondo and
                  Yu Takahashi},
  title        = {Superresolution-based stereo signal separation via supervised nonnegative
                  matrix factorization},
  booktitle    = {18th International Conference on Digital Signal Processing, {DSP}
                  2013, Fira, Santorini, Greece, July 1-3, 2013},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICDSP.2013.6622684},
  doi          = {10.1109/ICDSP.2013.6622684},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/icdsp/KitamuraSISKT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icdsp/KitamuraSSKT13,
  author       = {Daichi Kitamura and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Kazunobu Kondo and
                  Yu Takahashi},
  title        = {Music signal separation by supervised nonnegative matrix factorization
                  with basis deformation},
  booktitle    = {18th International Conference on Digital Signal Processing, {DSP}
                  2013, Fira, Santorini, Greece, July 1-3, 2013},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICDSP.2013.6622812},
  doi          = {10.1109/ICDSP.2013.6622812},
  timestamp    = {Wed, 24 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icdsp/KitamuraSSKT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaruwatariKMSK13,
  author       = {Hiroshi Saruwatari and
                  Suzumi Kanehara and
                  Ryoichi Miyazaki and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  editor       = {Fr{\'{e}}d{\'{e}}ric Bimbot and
                  Christophe Cerisara and
                  C{\'{e}}cile Fougeron and
                  Guillaume Gravier and
                  Lori Lamel and
                  Fran{\c{c}}ois Pellegrino and
                  Pascal Perrier},
  title        = {Musical noise analysis for {Bayesian} minimum mean-square error speech
                  amplitude estimators based on higher-order statistics},
  booktitle    = {{INTERSPEECH} 2013, 14th Annual Conference of the International Speech
                  Communication Association, Lyon, France, August 25-29, 2013},
  pages        = {441--445},
  publisher    = {{ISCA}},
  year         = {2013},
  url          = {https://doi.org/10.21437/Interspeech.2013-131},
  doi          = {10.21437/INTERSPEECH.2013-131},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SaruwatariKMSK13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ispacs/SaruwatariM13,
  author       = {Hiroshi Saruwatari and
                  Ryoichi Miyazaki},
  title        = {Information-geometric optimization for nonlinear noise reduction systems},
  booktitle    = {International Symposium on Intelligent Signal Processing and Communication
                  Systems, {ISPACS} 2013, Naha-shi, Japan, November 12-15, 2013},
  pages        = {192--197},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ISPACS.2013.6704545},
  doi          = {10.1109/ISPACS.2013.6704545},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/ispacs/SaruwatariM13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isspit/KitamuraSYSTK13,
  author       = {Daichi Kitamura and
                  Hiroshi Saruwatari and
                  Kosuke Yagi and
                  Kiyohiro Shikano and
                  Yu Takahashi and
                  Kazunobu Kondo},
  title        = {Robust music signal separation based on supervised nonnegative matrix
                  factorization with prevention of basis sharing},
  booktitle    = {{IEEE} International Symposium on Signal Processing and Information
                  Technology, {ISSPIT} 2013, Athens, Greece, December 12-15, 2013},
  pages        = {392--397},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/ISSPIT.2013.6781913},
  doi          = {10.1109/ISSPIT.2013.6781913},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/isspit/KitamuraSYSTK13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/MiyazakiSS12,
  author       = {Ryoichi Miyazaki and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Theoretical Analysis of Amounts of Musical Noise and Speech Distortion
                  in Structure-Generalized Parametric Blind Spatial Subtraction Array},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {E95-A},
  number       = {2},
  pages        = {586--590},
  year         = {2012},
  url          = {https://doi.org/10.1587/transfun.E95.A.586},
  doi          = {10.1587/TRANSFUN.E95.A.586},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/MiyazakiSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/WakisakaSST12,
  author       = {Ryo Wakisaka and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Tomoya Takatani},
  title        = {Speech Prior Estimation for Generalized Minimum Mean-Square Error
                  Short-Time Spectral Amplitude Estimator},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {E95-A},
  number       = {2},
  pages        = {591--595},
  year         = {2012},
  url          = {https://doi.org/10.1587/transfun.E95.A.591},
  doi          = {10.1587/TRANSFUN.E95.A.591},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/WakisakaSST12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/speech/NakamuraTSS12,
  author       = {Keigo Nakamura and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Speaking-aid systems using {GMM}-based voice conversion for electrolaryngeal
                  speech},
  journal      = {Speech Commun.},
  volume       = {54},
  number       = {1},
  pages        = {134--146},
  year         = {2012},
  url          = {https://doi.org/10.1016/j.specom.2011.07.007},
  doi          = {10.1016/J.SPECOM.2011.07.007},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/speech/NakamuraTSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/MiyazakiSITSK12,
  author       = {Ryoichi Miyazaki and
                  Hiroshi Saruwatari and
                  Takayuki Inoue and
                  Yu Takahashi and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Musical-Noise-Free Speech Enhancement Based on Optimized Iterative
                  Spectral Subtraction},
  journal      = {{IEEE} Trans. Audio Speech Lang. Process.},
  volume       = {20},
  number       = {7},
  pages        = {2080--2094},
  year         = {2012},
  url          = {https://doi.org/10.1109/TASL.2012.2196513},
  doi          = {10.1109/TASL.2012.2196513},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/MiyazakiSITSK12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/AprilyantiSST12,
  author       = {Fine Dwinita Aprilyanti and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Tomoya Takatani},
  title        = {Optimization scheme of joint noise suppression and dereverberation
                  based on higher-order statistics},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} 2012, Hollywood, CA, USA, December
                  3-6, 2012},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://ieeexplore.ieee.org/document/6411822/},
  timestamp    = {Sun, 08 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/apsipa/AprilyantiSST12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/KaneharaSMSK12,
  author       = {Suzumi Kanehara and
                  Hiroshi Saruwatari and
                  Ryoichi Miyazaki and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Comparative study on various noise reduction methods with decision-directed
                  a priori {SNR} estimator via higher-order statistics},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} 2012, Hollywood, CA, USA, December
                  3-6, 2012},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://ieeexplore.ieee.org/document/6411806/},
  timestamp    = {Sun, 08 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/apsipa/KaneharaSMSK12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/NishimuraKSS12,
  author       = {Kazuma Nishimura and
                  Hiromichi Kawanami and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Response generation based on statistical machine translation for speech-oriented
                  guidance system},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} 2012, Hollywood, CA, USA, December
                  3-6, 2012},
  pages        = {1--4},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://ieeexplore.ieee.org/document/6411808/},
  timestamp    = {Sun, 08 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/apsipa/NishimuraKSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/OnumaKSS12,
  author       = {Yuji Onuma and
                  Noriyoshi Kamado and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Real-time semi-blind speech extraction with speaker direction tracking
                  on {Kinect}},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} 2012, Hollywood, CA, USA, December
                  3-6, 2012},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://ieeexplore.ieee.org/document/6411817/},
  timestamp    = {Sun, 08 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/apsipa/OnumaKSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/TakahashiMSK12,
  author       = {Yu Takahashi and
                  Ryoichi Miyazaki and
                  Hiroshi Saruwatari and
                  Kazunobu Kondo},
  title        = {Theoretical analysis of musical noise in nonlinear noise reduction
                  based on higher-order statistics},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} 2012, Hollywood, CA, USA, December
                  3-6, 2012},
  pages        = {1--10},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://ieeexplore.ieee.org/document/6411877/},
  timestamp    = {Sun, 08 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/apsipa/TakahashiMSK12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/SaruwatariWSMTNB12,
  author       = {Hiroshi Saruwatari and
                  Ryo Wakisaka and
                  Kiyohiro Shikano and
                  Fr{\'{e}}d{\'{e}}ric Musti{\`{e}}re and
                  Louis Thibault and
                  Hossein Najaf{-}Zadeh and
                  Martin Bouchard},
  title        = {Sound-localization-preserved binaural {MMSE} {STSA} estimator with
                  explicit and implicit binaural cues},
  booktitle    = {Proceedings of the 20th European Signal Processing Conference, {EUSIPCO}
                  2012, Bucharest, Romania, August 27-31, 2012},
  pages        = {310--314},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://ieeexplore.ieee.org/document/6334345/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/SaruwatariWSMTNB12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/KamadoHSS12,
  author       = {Noriyoshi Kamado and
                  Masayuki Hirata and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Object-based stereo up-mixer for wave field synthesis based on spatial
                  information clustering},
  booktitle    = {Proceedings of the 20th European Signal Processing Conference, {EUSIPCO}
                  2012, Bucharest, Romania, August 27-31, 2012},
  pages        = {594--598},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://ieeexplore.ieee.org/document/6334180/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/KamadoHSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/WakisakaSST12,
  author       = {Ryo Wakisaka and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Tomoya Takatani},
  title        = {Speech kurtosis estimation from observed noisy signal based on generalized
                  {Gaussian} distribution prior and additivity of cumulants},
  booktitle    = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages        = {4049--4052},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICASSP.2012.6288807},
  doi          = {10.1109/ICASSP.2012.6288807},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/WakisakaSST12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/YamamotoTDSS12,
  author       = {Kenzo Yamamoto and
                  Tomoki Toda and
                  Hironori Doi and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Statistical approach to voice quality control in esophageal speech
                  enhancement},
  booktitle    = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages        = {4497--4500},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICASSP.2012.6287949},
  doi          = {10.1109/ICASSP.2012.6287949},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/YamamotoTDSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/MiyazakiSISK12,
  author       = {Ryoichi Miyazaki and
                  Hiroshi Saruwatari and
                  Takayuki Inoue and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Musical-noise-free speech enhancement: Theory and evaluation},
  booktitle    = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages        = {4565--4568},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICASSP.2012.6288934},
  doi          = {10.1109/ICASSP.2012.6288934},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/MiyazakiSISK12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/MajimaTFKMSS12,
  author       = {Haruka Majima and
                  Rafael Torres and
                  Yoko Fujita and
                  Hiromichi Kawanami and
                  Tomoko Matsui and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Spoken Inquiry Discrimination Using Bag-of-Words for Speech-Oriented
                  Guidance System},
  booktitle    = {{INTERSPEECH} 2012, 13th Annual Conference of the International Speech
                  Communication Association, Portland, Oregon, USA, September 9-13,
                  2012},
  pages        = {2097--2100},
  publisher    = {{ISCA}},
  year         = {2012},
  url          = {https://doi.org/10.21437/Interspeech.2012-559},
  doi          = {10.21437/INTERSPEECH.2012-559},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/MajimaTFKMSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/KuboKSS12,
  author       = {Keigo Kubo and
                  Hiromichi Kawanami and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Evaluation of Many-to-Many Alignment Algorithm by Automatic Pronunciation
                  Annotation Using Web Text Mining},
  booktitle    = {{INTERSPEECH} 2012, 13th Annual Conference of the International Speech
                  Communication Association, Portland, Oregon, USA, September 9-13,
                  2012},
  pages        = {2318--2321},
  publisher    = {{ISCA}},
  year         = {2012},
  url          = {https://doi.org/10.21437/Interspeech.2012-608},
  doi          = {10.21437/INTERSPEECH.2012-608},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/KuboKSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isspa/MiyazakiSSK12,
  author       = {Ryoichi Miyazaki and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Musical-noise-free blind speech extraction using {ICA}-based noise estimation
                  and iterative spectral subtraction},
  booktitle    = {11th International Conference on Information Science, Signal Processing
                  and their Applications, {ISSPA} 2012, Montreal, QC, Canada, July 2-5,
                  2012},
  pages        = {286--291},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ISSPA.2012.6310561},
  doi          = {10.1109/ISSPA.2012.6310561},
  timestamp    = {Wed, 16 Oct 2019 14:14:56 +0200},
  biburl       = {https://dblp.org/rec/conf/isspa/MiyazakiSSK12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isspit/ItoiMTSS12,
  author       = {Miyuki Itoi and
                  Ryoichi Miyazaki and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Blind speech extraction for {Non-Audible Murmur} speech with speaker's
                  movement noise},
  booktitle    = {{IEEE} International Symposium on Signal Processing and Information
                  Technology, {ISSPIT} 2012, Ho Chi Minh City, Vietnam, December 12-15,
                  2012},
  pages        = {320--325},
  publisher    = {{IEEE} Computer Society},
  year         = {2012},
  url          = {https://doi.org/10.1109/ISSPIT.2012.6621308},
  doi          = {10.1109/ISSPIT.2012.6621308},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/isspit/ItoiMTSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iwaenc/KaneharaSMSK12,
  author       = {Suzumi Kanehara and
                  Hiroshi Saruwatari and
                  Ryoichi Miyazaki and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Theoretical Analysis of Musical Noise Generation in Noise Reduction
                  Methods with Decision-Directed a Priori {SNR} Estimator},
  booktitle    = {{IWAENC} 2012 - International Workshop on Acoustic Signal Enhancement,
                  Proceedings, {RWTH} Aachen University, Germany, September 4th - 6th,
                  2012},
  publisher    = {VDE-Verlag},
  year         = {2012},
  url          = {http://www.vde-verlag.de/proceedings-de/453451049.html},
  timestamp    = {Fri, 17 May 2013 18:34:53 +0200},
  biburl       = {https://dblp.org/rec/conf/iwaenc/KaneharaSMSK12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iwaenc/MiyazakiSSK12,
  author       = {Ryoichi Miyazaki and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Musical-Noise-Free Blind Speech Extraction Using {ICA}-Based Noise Estimation
                  with Channel Selection},
  booktitle    = {{IWAENC} 2012 - International Workshop on Acoustic Signal Enhancement,
                  Proceedings, {RWTH} Aachen University, Germany, September 4th - 6th,
                  2012},
  publisher    = {VDE-Verlag},
  year         = {2012},
  url          = {http://www.vde-verlag.de/proceedings-de/453451056.html},
  timestamp    = {Fri, 17 May 2013 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iwaenc/MiyazakiSSK12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iwsds/HaraKSS12,
  author       = {Sunao Hara and
                  Hiromichi Kawanami and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Joseph Mariani and
                  Sophie Rosset and
                  Martine Garnier{-}Rizet and
                  Laurence Devillers},
  title        = {Development of a Toolkit Handling Multiple Speech-Oriented Guidance
                  Agents for Mobile Applications},
  booktitle    = {Natural Interaction with Robots, Knowbots and Smartphones, 4th International
                  Workshop on Spoken Dialogue Systems, {IWSDS} 2012, Paris, France,
                  November 28-30, 2012},
  pages        = {79--85},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-1-4614-8280-2\_8},
  doi          = {10.1007/978-1-4614-8280-2\_8},
  timestamp    = {Thu, 29 Apr 2021 13:34:52 +0200},
  biburl       = {https://dblp.org/rec/conf/iwsds/HaraKSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iwsds/TorresKMSS12,
  author       = {Rafael Torres and
                  Hiromichi Kawanami and
                  Tomoko Matsui and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Joseph Mariani and
                  Sophie Rosset and
                  Martine Garnier{-}Rizet and
                  Laurence Devillers},
  title        = {Topic Classification of Spoken Inquiries Using Transductive Support
                  Vector Machine},
  booktitle    = {Natural Interaction with Robots, Knowbots and Smartphones, 4th International
                  Workshop on Spoken Dialogue Systems, {IWSDS} 2012, Paris, France,
                  November 28-30, 2012},
  pages        = {261--267},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-1-4614-8280-2\_23},
  doi          = {10.1007/978-1-4614-8280-2\_23},
  timestamp    = {Thu, 29 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iwsds/TorresKMSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iwsds/MajimaTKHMSS12,
  author       = {Haruka Majima and
                  Rafael Torres and
                  Hiromichi Kawanami and
                  Sunao Hara and
                  Tomoko Matsui and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Joseph Mariani and
                  Sophie Rosset and
                  Martine Garnier{-}Rizet and
                  Laurence Devillers},
  title        = {Evaluation of Invalid Input Discrimination Using Bag-of-Words for
                  Speech-Oriented Guidance System},
  booktitle    = {Natural Interaction with Robots, Knowbots and Smartphones, 4th International
                  Workshop on Spoken Dialogue Systems, {IWSDS} 2012, Paris, France,
                  November 28-30, 2012},
  pages        = {389--397},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-1-4614-8280-2\_35},
  doi          = {10.1007/978-1-4614-8280-2\_35},
  timestamp    = {Thu, 29 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iwsds/MajimaTKHMSS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/KamadoHSSS11,
  author       = {Noriyoshi Kamado and
                  Haruhide Hokari and
                  Shoji Shimada and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Sound Field Reproduction by Wavefront Synthesis Using Directly Aligned
                  Multi Point Control},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {E94-A},
  number       = {3},
  pages        = {907--920},
  year         = {2011},
  url          = {https://doi.org/10.1587/transfun.E94.A.907},
  doi          = {10.1587/TRANSFUN.E94.A.907},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/KamadoHSSS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/SaruwatariITISK11,
  author       = {Hiroshi Saruwatari and
                  Yohei Ishikawa and
                  Yu Takahashi and
                  Takayuki Inoue and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Musical Noise Controllable Algorithm of Channelwise Spectral Subtraction
                  and Adaptive Beamforming Based on Higher Order Statistics},
  journal      = {{IEEE} Trans. Audio Speech Lang. Process.},
  volume       = {19},
  number       = {6},
  pages        = {1457--1466},
  year         = {2011},
  url          = {https://doi.org/10.1109/TASL.2010.2091636},
  doi          = {10.1109/TASL.2010.2091636},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/SaruwatariITISK11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/InoueSTSK11,
  author       = {Takayuki Inoue and
                  Hiroshi Saruwatari and
                  Yu Takahashi and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Theoretical Analysis of Musical Noise in Generalized Spectral Subtraction
                  Based on Higher Order Statistics},
  journal      = {{IEEE} Trans. Audio Speech Lang. Process.},
  volume       = {19},
  number       = {6},
  pages        = {1770--1779},
  year         = {2011},
  url          = {https://doi.org/10.1109/TASL.2010.2098871},
  doi          = {10.1109/TASL.2010.2098871},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/InoueSTSK11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/IshiiTSSN11,
  author       = {Shunta Ishii and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Sakriani Sakti and
                  Satoshi Nakamura},
  editor       = {David Nahamoo and
                  Michael Picheny},
  title        = {Blind noise suppression for {Non-Audible Murmur} recognition with stereo
                  signal processing},
  booktitle    = {2011 {IEEE} Workshop on Automatic Speech Recognition {\&} Understanding,
                  {ASRU} 2011, Waikoloa, HI, USA, December 11-15, 2011},
  pages        = {494--499},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ASRU.2011.6163981},
  doi          = {10.1109/ASRU.2011.6163981},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/asru/IshiiTSSN11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/KondoTHSNT11,
  author       = {Kazunobu Kondo and
                  Yu Takahashi and
                  Seiichi Hashimoto and
                  Hiroshi Saruwatari and
                  Takanori Nishino and
                  Kazuya Takeda},
  title        = {Efficient blind speech separation suitable for embedded devices},
  booktitle    = {Proceedings of the 19th European Signal Processing Conference, {EUSIPCO}
                  2011, Barcelona, Spain, August 29 - Sept. 2, 2011},
  pages        = {2319--2323},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://ieeexplore.ieee.org/document/7074189/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/KondoTHSNT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/NawataKSS11,
  author       = {Hiroyuki Nawata and
                  Noriyoshi Kamado and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Automatic musical thumbnailing based on audio object localization
                  and its evaluation},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress
                  Center, Prague, Czech Republic},
  pages        = {41--44},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ICASSP.2011.5946323},
  doi          = {10.1109/ICASSP.2011.5946323},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/NawataKSS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/KamadoSS11,
  author       = {Noriyoshi Kamado and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Robust sound field reproduction integrating multi-point sound field
                  control and wave field synthesis},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress
                  Center, Prague, Czech Republic},
  pages        = {441--444},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ICASSP.2011.5946435},
  doi          = {10.1109/ICASSP.2011.5946435},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/KamadoSS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/InoueSSK11,
  author       = {Takayuki Inoue and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Theoretical analysis of musical noise in {Wiener} filtering family via
                  higher-order statistics},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress
                  Center, Prague, Czech Republic},
  pages        = {5076--5079},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ICASSP.2011.5947498},
  doi          = {10.1109/ICASSP.2011.5947498},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/InoueSSK11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/DoiNTSS11,
  author       = {Hironori Doi and
                  Keigo Nakamura and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {An evaluation of alaryngeal speech enhancement methods based on voice
                  conversion techniques},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress
                  Center, Prague, Czech Republic},
  pages        = {5136--5139},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ICASSP.2011.5947513},
  doi          = {10.1109/ICASSP.2011.5947513},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/DoiNTSS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/BabaniTSS11,
  author       = {Denis Babani and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Acoustic model training for non-audible murmur recognition using transformed
                  normal speech data},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress
                  Center, Prague, Czech Republic},
  pages        = {5224--5227},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ICASSP.2011.5947535},
  doi          = {10.1109/ICASSP.2011.5947535},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/BabaniTSS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/MiyazakiSS11,
  author       = {Ryoichi Miyazaki and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Theoretical Analysis of Musical Noise and Speech Distortion in Structure-Generalized
                  Parametric Blind Spatial Subtraction Array},
  booktitle    = {{INTERSPEECH} 2011, 12th Annual Conference of the International Speech
                  Communication Association, Florence, Italy, August 27-31, 2011},
  pages        = {341--344},
  publisher    = {{ISCA}},
  year         = {2011},
  url          = {https://doi.org/10.21437/Interspeech.2011-125},
  doi          = {10.21437/INTERSPEECH.2011-125},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/MiyazakiSS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/WakisakaSST11,
  author       = {Ryo Wakisaka and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Tomoya Takatani},
  title        = {Blind Speech Prior Estimation for Generalized Minimum Mean-Square
                  Error Short-Time Spectral Amplitude Estimator},
  booktitle    = {{INTERSPEECH} 2011, 12th Annual Conference of the International Speech
                  Communication Association, Florence, Italy, August 27-31, 2011},
  pages        = {361--364},
  publisher    = {{ISCA}},
  year         = {2011},
  url          = {https://doi.org/10.21437/Interspeech.2011-130},
  doi          = {10.21437/INTERSPEECH.2011-130},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/WakisakaSST11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/HattoriTKSS11,
  author       = {Nobuhiko Hattori and
                  Tomoki Toda and
                  Hisashi Kawai and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Speaker-Adaptive Speech Synthesis Based on Eigenvoice Conversion and
                  Language-Dependent Prosodic Conversion in Speech-to-Speech Translation},
  booktitle    = {{INTERSPEECH} 2011, 12th Annual Conference of the International Speech
                  Communication Association, Florence, Italy, August 27-31, 2011},
  pages        = {2769--2772},
  publisher    = {{ISCA}},
  year         = {2011},
  url          = {https://doi.org/10.21437/Interspeech.2011-693},
  doi          = {10.21437/INTERSPEECH.2011-693},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HattoriTKSS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isspit/SaruwatariHHWST11,
  author       = {Hiroshi Saruwatari and
                  Nobuhisa Hirata and
                  Toshiyuki Hatta and
                  Ryo Wakisaka and
                  Kiyohiro Shikano and
                  Tomoya Takatani},
  editor       = {Adel Elmaghraby and
                  Dimitrios N. Serpanos},
  title        = {Semi-blind speech extraction for robot using visual information and
                  noise statistics},
  booktitle    = {2011 {IEEE} International Symposium on Signal Processing and Information
                  Technology, {ISSPIT} 2011, Bilbao, Spain, December 14-17, 2011},
  pages        = {264--269},
  publisher    = {{IEEE} Computer Society},
  year         = {2011},
  url          = {https://doi.org/10.1109/ISSPIT.2011.6151571},
  doi          = {10.1109/ISSPIT.2011.6151571},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/isspit/SaruwatariHHWST11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ejasp/TakahashiSSK10,
  author       = {Yu Takahashi and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Musical-Noise Analysis in Methods of Integrating Microphone Array
                  and Spectral Subtraction Based on Higher-Order Statistics},
  journal      = {{EURASIP} J. Adv. Signal Process.},
  volume       = {2010},
  year         = {2010},
  url          = {https://doi.org/10.1155/2010/431347},
  doi          = {10.1155/2010/431347},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ejasp/TakahashiSSK10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/OhtaniTSS10,
  author       = {Yamato Ohtani and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Adaptive Training for Voice Conversion Based on Eigenvoices},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {93-D},
  number       = {6},
  pages        = {1589--1598},
  year         = {2010},
  url          = {https://doi.org/10.1587/transinf.E93.D.1589},
  doi          = {10.1587/TRANSINF.E93.D.1589},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/OhtaniTSS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/NakamuraTSS10,
  author       = {Keigo Nakamura and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Evaluation of Extremely Small Sound Source Signals Used in Speaking-Aid
                  System with Statistical Voice Conversion},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {93-D},
  number       = {7},
  pages        = {1909--1917},
  year         = {2010},
  url          = {https://doi.org/10.1587/transinf.E93.D.1909},
  doi          = {10.1587/TRANSINF.E93.D.1909},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/NakamuraTSS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/DoiNTSS10,
  author       = {Hironori Doi and
                  Keigo Nakamura and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Esophageal Speech Enhancement Based on Statistical Voice Conversion
                  with {Gaussian} Mixture Models},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {93-D},
  number       = {9},
  pages        = {2472--2482},
  year         = {2010},
  url          = {https://doi.org/10.1587/transinf.E93.D.2472},
  doi          = {10.1587/TRANSINF.E93.D.2472},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/DoiNTSS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/OhtaniTSS10a,
  author       = {Yamato Ohtani and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Improvements of the One-to-Many Eigenvoice Conversion System},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {93-D},
  number       = {9},
  pages        = {2491--2499},
  year         = {2010},
  url          = {https://doi.org/10.1587/transinf.E93.D.2491},
  doi          = {10.1587/TRANSINF.E93.D.2491},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/OhtaniTSS10a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cogip/IshikawaSTSK10,
  author       = {Yohei Ishikawa and
                  Hiroshi Saruwatari and
                  Yu Takahashi and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Musical noise controllable algorithm of channelwise spectral subtraction
                  and beamforming based on higher-order statistics criterion},
  booktitle    = {2nd International Workshop on Cognitive Information Processing, {CIP}
                  2010, Elba, Italy, 14-16 June, 2010},
  pages        = {81--86},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/CIP.2010.5604226},
  doi          = {10.1109/CIP.2010.5604226},
  timestamp    = {Wed, 16 Oct 2019 14:14:48 +0200},
  biburl       = {https://dblp.org/rec/conf/cogip/IshikawaSTSK10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/InoueTSSK10,
  author       = {Takayuki Inoue and
                  Yu Takahashi and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Theoretical analysis of musical noise in generalized spectral subtraction:
                  Why should not use power/amplitude subtraction?},
  booktitle    = {18th European Signal Processing Conference, {EUSIPCO} 2010, Aalborg,
                  Denmark, August 23-27, 2010},
  pages        = {994--998},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://ieeexplore.ieee.org/document/7096577/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/InoueTSSK10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/EvenSST10,
  author       = {Jani Even and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Tomoya Takatani},
  title        = {Blind signal extraction based joint suppression of diffuse background
                  noise and late reverberation},
  booktitle    = {18th European Signal Processing Conference, {EUSIPCO} 2010, Aalborg,
                  Denmark, August 23-27, 2010},
  pages        = {1534--1538},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://ieeexplore.ieee.org/document/7096554/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/EvenSST10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ica/SaruwatariOTS10,
  author       = {Hiroshi Saruwatari and
                  Ryoi Okamoto and
                  Yu Takahashi and
                  Kiyohiro Shikano},
  editor       = {Vincent Vigneron and
                  Vicente Zarzoso and
                  Eric Moreau and
                  R{\'{e}}mi Gribonval and
                  Emmanuel Vincent},
  title        = {Blind Speech Extraction Combining Generalized {MMSE} {STSA} Estimator
                  and {ICA}-Based Noise and Speech Probability Density Function Estimations},
  booktitle    = {Latent Variable Analysis and Signal Separation - 9th International
                  Conference, {LVA/ICA} 2010, St. Malo, France, September 27-30, 2010.
                  Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {6365},
  pages        = {49--56},
  publisher    = {Springer},
  year         = {2010},
  url          = {https://doi.org/10.1007/978-3-642-15995-4\_7},
  doi          = {10.1007/978-3-642-15995-4\_7},
  timestamp    = {Mon, 05 Feb 2024 20:32:12 +0100},
  biburl       = {https://dblp.org/rec/conf/ica/SaruwatariOTS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/TakahashiSSK10,
  author       = {Yu Takahashi and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Kazunobu Kondo},
  title        = {Theoretical musical-noise analysis and its generalization for methods
                  of integrating beamforming and spectral subtraction based on higher-order
                  statistics},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {93--96},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5496173},
  doi          = {10.1109/ICASSP.2010.5496173},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/TakahashiSSK10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/EvenSST10,
  author       = {Jani Even and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Tomoya Takatani},
  title        = {Complex {Newton} algorithm for blind signal extraction of speech in
                  diffuse noise},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {213--216},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5496023},
  doi          = {10.1109/ICASSP.2010.5496023},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/EvenSST10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/DoiNTSS10,
  author       = {Hironori Doi and
                  Keigo Nakamura and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Statistical approach to enhancing esophageal speech based on {Gaussian}
                  mixture models},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {4250--4253},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495676},
  doi          = {10.1109/ICASSP.2010.5495676},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/DoiNTSS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/EvenSST10a,
  author       = {Jani Even and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Tomoya Takatani},
  title        = {Speech enhancement in presence of diffuse background noise: Why using
                  blind signal extraction?},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {4770--4773},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495160},
  doi          = {10.1109/ICASSP.2010.5495160},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/EvenSST10a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/OkamotoTSS10,
  author       = {Ryoi Okamoto and
                  Yu Takahashi and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {{MMSE} {STSA} estimator with nonstationary noise estimation based
                  on {ICA} for high-quality speech enhancement},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {4778--4781},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495162},
  doi          = {10.1109/ICASSP.2010.5495162},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/OkamotoTSS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/OhtaniTSS10,
  author       = {Yamato Ohtani and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Non-parallel training for many-to-many eigenvoice conversion},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {4822--4825},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495139},
  doi          = {10.1109/ICASSP.2010.5495139},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/OhtaniTSS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/EvenISH10,
  author       = {Jani Even and
                  Carlos Toshinori Ishi and
                  Hiroshi Saruwatari and
                  Norihiro Hagita},
  editor       = {Takao Kobayashi and
                  Keikichi Hirose and
                  Satoshi Nakamura},
  title        = {Close speaker cancellation for suppression of non-stationary background
                  noise for hands-free speech interface},
  booktitle    = {{INTERSPEECH} 2010, 11th Annual Conference of the International Speech
                  Communication Association, Makuhari, Chiba, Japan, September 26-30,
                  2010},
  pages        = {977--980},
  publisher    = {{ISCA}},
  year         = {2010},
  url          = {https://doi.org/10.21437/Interspeech.2010-326},
  doi          = {10.21437/INTERSPEECH.2010-326},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/EvenISH10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/TorresTKMSS10,
  author       = {Rafael Torres and
                  Shota Takeuchi and
                  Hiromichi Kawanami and
                  Tomoko Matsui and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Takao Kobayashi and
                  Keikichi Hirose and
                  Satoshi Nakamura},
  title        = {Comparison of methods for topic classification in a speech-oriented
                  guidance system},
  booktitle    = {{INTERSPEECH} 2010, 11th Annual Conference of the International Speech
                  Communication Association, Makuhari, Chiba, Japan, September 26-30,
                  2010},
  pages        = {1261--1264},
  publisher    = {{ISCA}},
  year         = {2010},
  url          = {https://doi.org/10.21437/Interspeech.2010-397},
  doi          = {10.21437/INTERSPEECH.2010-397},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/TorresTKMSS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/NakamuraTSS10,
  author       = {Keigo Nakamura and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Takao Kobayashi and
                  Keikichi Hirose and
                  Satoshi Nakamura},
  title        = {The use of air-pressure sensor in electrolaryngeal speech enhancement
                  based on statistical voice conversion},
  booktitle    = {{INTERSPEECH} 2010, 11th Annual Conference of the International Speech
                  Communication Association, Makuhari, Chiba, Japan, September 26-30,
                  2010},
  pages        = {1628--1631},
  publisher    = {{ISCA}},
  year         = {2010},
  url          = {https://doi.org/10.21437/Interspeech.2010-471},
  doi          = {10.21437/INTERSPEECH.2010-471},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/NakamuraTSS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/OhtaTOSS10,
  author       = {Kumi Ohta and
                  Tomoki Toda and
                  Yamato Ohtani and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Takao Kobayashi and
                  Keikichi Hirose and
                  Satoshi Nakamura},
  title        = {Adaptive voice-quality control based on one-to-many eigenvoice conversion},
  booktitle    = {{INTERSPEECH} 2010, 11th Annual Conference of the International Speech
                  Communication Association, Makuhari, Chiba, Japan, September 26-30,
                  2010},
  pages        = {2158--2161},
  publisher    = {{ISCA}},
  year         = {2010},
  url          = {https://doi.org/10.21437/Interspeech.2010-595},
  doi          = {10.21437/INTERSPEECH.2010-595},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/OhtaTOSS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/SawadaESST10,
  author       = {Hiroshi Sawada and
                  Jani Even and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Tomoya Takatani},
  title        = {Improvement of speech recognition performance for spoken-oriented
                  robot dialog system using end-fire array},
  booktitle    = {2010 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, October 18-22, 2010, Taipei, Taiwan},
  pages        = {970--975},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/IROS.2010.5648924},
  doi          = {10.1109/IROS.2010.5648924},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/SawadaESST10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ssw/HayashidaTOSS10,
  author       = {Chie Hayashida and
                  Tomoki Toda and
                  Yamato Ohtani and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Yoshinori Sagisaka and
                  Keiichi Tokuda},
  title        = {Linear transformation approaches to many-to-one voice conversion},
  booktitle    = {The Seventh {ISCA} Tutorial and Research Workshop on Speech Synthesis,
                  Kyoto, Japan, September 22-24, 2010},
  pages        = {74--79},
  publisher    = {{ISCA}},
  year         = {2010},
  url          = {http://www.isca-speech.org/archive/ssw7/ssw7\_074.html},
  timestamp    = {Tue, 16 Nov 2021 11:36:19 +0100},
  biburl       = {https://dblp.org/rec/conf/ssw/HayashidaTOSS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/dsp/PrasadSS09,
  author       = {Rajkishore Prasad and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Enhancement of speech signals separated from their convolutive mixture
                  by {FDICA} algorithm},
  journal      = {Digit. Signal Process.},
  volume       = {19},
  number       = {1},
  pages        = {127--133},
  year         = {2009},
  url          = {https://doi.org/10.1016/j.dsp.2008.01.007},
  doi          = {10.1016/J.DSP.2008.01.007},
  timestamp    = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/dsp/PrasadSS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/speech/GomezTSS09,
  author       = {Randy Gomez and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Techniques in rapid unsupervised speaker adaptation based on {HMM}-Sufficient
                  Statistics},
  journal      = {Speech Commun.},
  volume       = {51},
  number       = {1},
  pages        = {42--57},
  year         = {2009},
  url          = {https://doi.org/10.1016/j.specom.2008.05.014},
  doi          = {10.1016/J.SPECOM.2008.05.014},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/speech/GomezTSS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/TakahashiTOSS09,
  author       = {Yu Takahashi and
                  Tomoya Takatani and
                  Keiichi Osako and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Blind Spatial Subtraction Array for Speech Enhancement in Noisy Environment},
  journal      = {{IEEE} Trans. Audio Speech Lang. Process.},
  volume       = {17},
  number       = {4},
  pages        = {650--664},
  year         = {2009},
  url          = {https://doi.org/10.1109/TASL.2008.2011517},
  doi          = {10.1109/TASL.2008.2011517},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/TakahashiTOSS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/EvenSS09,
  author       = {Jani Even and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Enhanced {Wiener} post-processing based on partial projection back of
                  the blind signal separation noise estimate},
  booktitle    = {17th European Signal Processing Conference, {EUSIPCO} 2009, Glasgow,
                  Scotland, UK, August 24-28, 2009},
  pages        = {1442--1446},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://ieeexplore.ieee.org/document/7077808/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/EvenSS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/HiekataMIHZTSS09,
  author       = {Takashi Hiekata and
                  Takashi Morita and
                  Youhei Ikeda and
                  Hiroshi Hashimoto and
                  Ruoyu Zhang and
                  Yu Takahashi and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Multiple {ICA}-based real-time blind source extraction applied to handy
                  size microphone},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages        = {121--124},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4959535},
  doi          = {10.1109/ICASSP.2009.4959535},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/HiekataMIHZTSS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/TakahashiUSSK09,
  author       = {Yu Takahashi and Yoshihisa Uemura and Hiroshi Saruwatari and Kiyohiro Shikano and Kazunobu Kondo},
  title        = {Musical noise analysis based on higher order statistics for microphone array and nonlinear signal processing},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages        = {229--232},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4959562},
  doi          = {10.1109/ICASSP.2009.4959562},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/TakahashiUSSK09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/MiyabeJSS09,
  author       = {Shigeki Miyabe and Biing{-}Hwang Juang and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Kernel-based nonlinear independent component analysis for underdetermined blind source separation},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages        = {1641--1644},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4959915},
  doi          = {10.1109/ICASSP.2009.4959915},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/MiyabeJSS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/TakahashiSFTMMST09,
  author       = {Yu Takahashi and Hiroshi Saruwatari and Yuki Fujihara and Kentaro Tachibana and Yoshimitsu Mori and Shigeki Miyabe and Kiyohiro Shikano and Akira Tanaka},
  title        = {Source adaptive blind signal extraction using closed-form {ICA} for hands-free robot spoken dialogue system},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages        = {3681--3684},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4960425},
  doi          = {10.1109/ICASSP.2009.4960425},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/TakahashiSFTMMST09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaruwatariKTTCS09,
  author       = {Hiroshi Saruwatari and Hiromichi Kawanami and Shota Takeuchi and Yu Takahashi and Tobias Cincarek and Kiyohiro Shikano},
  title        = {Hands-free speech recognition challenge for real-world speech dialogue systems},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages        = {3729--3732},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4960437},
  doi          = {10.1109/ICASSP.2009.4960437},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/SaruwatariKTTCS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/MiyamotoNTSS09,
  author       = {Daisuke Miyamoto and Keigo Nakamura and Tomoki Toda and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Acoustic compensation methods for body transmitted speech conversion},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages        = {3901--3904},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4960480},
  doi          = {10.1109/ICASSP.2009.4960480},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/MiyamotoNTSS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/UemuraTSSK09,
  author       = {Yoshihisa Uemura and Yu Takahashi and Hiroshi Saruwatari and Kiyohiro Shikano and Kazunobu Kondo},
  title        = {Musical noise generation analysis for noise reduction methods based on spectral subtraction and {MMSE} {STSA} estimation},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages        = {4433--4436},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4960613},
  doi          = {10.1109/ICASSP.2009.4960613},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/UemuraTSSK09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ida/EvenSS09,
  author       = {Jani Even and Hiroshi Saruwatari and Kiyohiro Shikano},
  editor       = {T{\"{u}}lay Adali and Christian Jutten and Jo{\~{a}}o Marcos Travassos Romano and Allan Kardec Barros},
  title        = {Target Speech Enhancement in Presence of Jammer and Diffuse Background Noise},
  booktitle    = {Independent Component Analysis and Signal Separation, 8th International Conference, {ICA} 2009, Paraty, Brazil, March 15-18, 2009. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {5441},
  pages        = {565--572},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-00599-2\_71},
  doi          = {10.1007/978-3-642-00599-2\_71},
  timestamp    = {Tue, 14 May 2019 10:00:49 +0200},
  biburl       = {https://dblp.org/rec/conf/ida/EvenSS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/NakamuraTSS09,
  author       = {Keigo Nakamura and Tomoki Toda and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Electrolaryngeal speech enhancement based on statistical voice conversion},
  booktitle    = {{INTERSPEECH} 2009, 10th Annual Conference of the International Speech Communication Association, Brighton, United Kingdom, September 6-10, 2009},
  pages        = {1431--1434},
  publisher    = {{ISCA}},
  year         = {2009},
  url          = {https://doi.org/10.21437/Interspeech.2009-439},
  doi          = {10.21437/INTERSPEECH.2009-439},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/NakamuraTSS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/OhtaniTSS09,
  author       = {Yamato Ohtani and Tomoki Toda and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Many-to-many eigenvoice conversion with reference voice},
  booktitle    = {{INTERSPEECH} 2009, 10th Annual Conference of the International Speech Communication Association, Brighton, United Kingdom, September 6-10, 2009},
  pages        = {1623--1626},
  publisher    = {{ISCA}},
  year         = {2009},
  url          = {https://doi.org/10.21437/Interspeech.2009-485},
  doi          = {10.21437/INTERSPEECH.2009-485},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/OhtaniTSS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/EvenSSST09,
  author       = {Jani Even and Hiroshi Sawada and Hiroshi Saruwatari and Kiyohiro Shikano and Tomoya Takatani},
  title        = {Semi-blind suppression of internal noise for hands-free robot spoken dialog system},
  booktitle    = {2009 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, October 11-15, 2009, St. Louis, MO, {USA}},
  pages        = {658--663},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/IROS.2009.5354451},
  doi          = {10.1109/IROS.2009.5354451},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/EvenSSST09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/waspaa/MiyabeMSSN09,
  author       = {Shigeki Miyabe and Keisuke Masatoki and Hiroshi Saruwatari and Kiyohiro Shikano and Toshiyuki Nomura},
  title        = {Temporal quantization of spatial information using directional clustering for multichannel audio coding},
  booktitle    = {{IEEE} Workshop on Applications of Signal Processing to Audio and Acoustics, {WASPAA} '09, New Paltz, NY, USA, October 18-21, 2009},
  pages        = {261--264},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ASPAA.2009.5346519},
  doi          = {10.1109/ASPAA.2009.5346519},
  timestamp    = {Wed, 16 Oct 2019 14:14:57 +0200},
  biburl       = {https://dblp.org/rec/conf/waspaa/MiyabeMSSN09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/CincarekTSS08,
  author       = {Tobias Cincarek and Tomoki Toda and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Cost Reduction of Acoustic Modeling for Real-Environment Applications Using Unsupervised and Selective Training},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {91-D},
  number       = {3},
  pages        = {499--507},
  year         = {2008},
  url          = {https://doi.org/10.1093/ietisy/e91-d.3.499},
  doi          = {10.1093/IETISY/E91-D.3.499},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/CincarekTSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/CincarekKNLSS08,
  author       = {Tobias Cincarek and Hiromichi Kawanami and Ryuichi Nisimura and Akinobu Lee and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Development, Long-Term Operation and Portability of a Real-Environment Speech-Oriented Guidance System},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {91-D},
  number       = {3},
  pages        = {576--587},
  year         = {2008},
  url          = {https://doi.org/10.1093/ietisy/e91-d.3.576},
  doi          = {10.1093/IETISY/E91-D.3.576},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/CincarekKNLSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/NaginoSTSS08,
  author       = {Goshu Nagino and Makoto Shozakai and Tomoki Toda and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Building an Effective Speech Corpus by Utilizing Statistical Multidimensional Scaling Method},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {91-D},
  number       = {3},
  pages        = {607--614},
  year         = {2008},
  url          = {https://doi.org/10.1093/ietisy/e91-d.3.607},
  doi          = {10.1093/IETISY/E91-D.3.607},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/NaginoSTSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/YaiMSST08,
  author       = {Yuki Yai and Shigeki Miyabe and Hiroshi Saruwatari and Kiyohiro Shikano and Yosuke Tatekura},
  title        = {Rapid Compensation of Temperature Fluctuation Effect for Multichannel Sound Field Reproduction System},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {91-A},
  number       = {6},
  pages        = {1329--1336},
  year         = {2008},
  url          = {https://doi.org/10.1093/ietfec/e91-a.6.1329},
  doi          = {10.1093/IETFEC/E91-A.6.1329},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/YaiMSST08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/OsakoMTSS08,
  author       = {Keiichi Osako and Yoshimitsu Mori and Yu Takahashi and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Fast Convergence Blind Source Separation Using Frequency Subband Interpolation by Null Beamforming},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {91-A},
  number       = {6},
  pages        = {1357--1361},
  year         = {2008},
  url          = {https://doi.org/10.1093/ietfec/e91-a.6.1357},
  doi          = {10.1093/IETFEC/E91-A.6.1357},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ieicet/OsakoMTSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/EvenSS08,
  author       = {Jani Even and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Extension of score function difference for frequency domain blind source separation},
  booktitle    = {2008 16th European Signal Processing Conference, {EUSIPCO} 2008, Lausanne, Switzerland, August 25-29, 2008},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://ieeexplore.ieee.org/document/7080564/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/EvenSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/EvenSS08,
  author       = {Jani Even and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Frequency domain semi-blind signal separation: application to the rejection of internal noises},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2008, March 30 - April 4, 2008, Caesars Palace, Las Vegas, Nevada, {USA}},
  pages        = {157--160},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ICASSP.2008.4517570},
  doi          = {10.1109/ICASSP.2008.4517570},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/EvenSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/HaraguchiMSSN08,
  author       = {Yuuki Haraguchi and Shigeki Miyabe and Hiroshi Saruwatari and Kiyohiro Shikano and Toshiyuki Nomura},
  title        = {Source-oriented localization control of stereo audio signals based on blind source separation},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2008, March 30 - April 4, 2008, Caesars Palace, Las Vegas, Nevada, {USA}},
  pages        = {177--180},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ICASSP.2008.4517575},
  doi          = {10.1109/ICASSP.2008.4517575},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/HaraguchiMSSN08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Title: the acronym DOA is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/icassp/YuyamaMSS08,
  author       = {Yuuta Yuyama and
                  Shigeki Miyabe and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Hybrid structure of inverse filtering and {DOA}-parameterized wavefront
                  synthesis},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2008, March 30 - April 4, 2008, Caesars
                  Palace, Las Vegas, Nevada, {USA}},
  pages        = {401--404},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ICASSP.2008.4517631},
  doi          = {10.1109/ICASSP.2008.4517631},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/YuyamaMSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/GomezESS08,
  author       = {Randy Gomez and Jani Even and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Distant talking robust speech recognition using late reflection components of room impulse response},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2008, March 30 - April 4, 2008, Caesars Palace, Las Vegas, Nevada, {USA}},
  pages        = {4581--4584},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ICASSP.2008.4518676},
  doi          = {10.1109/ICASSP.2008.4518676},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/GomezESS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/TakeuchiCKSS08,
  author       = {Shota Takeuchi and Tobias Cincarek and Hiromichi Kawanami and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Question and answer database optimization using speech recognition results},
  booktitle    = {{INTERSPEECH} 2008, 9th Annual Conference of the International Speech Communication Association, Brisbane, Australia, September 22-26, 2008},
  pages        = {451--454},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-73},
  doi          = {10.21437/INTERSPEECH.2008-73},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/TakeuchiCKSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaruwatariTSTCKS08,
  author       = {Hiroshi Saruwatari and Yu Takahashi and Hiroyuki Sakai and Shota Takeuchi and Tobias Cincarek and Hiromichi Kawanami and Kiyohiro Shikano},
  title        = {Development and evaluation of hands-free spoken dialogue system for railway station guidance},
  booktitle    = {{INTERSPEECH} 2008, 9th Annual Conference of the International Speech Communication Association, Brisbane, Australia, September 22-26, 2008},
  pages        = {455--458},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-74},
  doi          = {10.21437/INTERSPEECH.2008-74},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SaruwatariTSTCKS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/MuramatsuOTSS08,
  author       = {Takashi Muramatsu and Yamato Ohtani and Tomoki Toda and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Low-delay voice conversion based on maximum likelihood estimation of spectral parameter trajectory},
  booktitle    = {{INTERSPEECH} 2008, 9th Annual Conference of the International Speech Communication Association, Brisbane, Australia, September 22-26, 2008},
  pages        = {1076--1079},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-332},
  doi          = {10.21437/INTERSPEECH.2008-332},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/MuramatsuOTSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/OhtaniTSS08,
  author       = {Yamato Ohtani and Tomoki Toda and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {An improved one-to-many eigenvoice conversion system},
  booktitle    = {{INTERSPEECH} 2008, 9th Annual Conference of the International Speech Communication Association, Brisbane, Australia, September 22-26, 2008},
  pages        = {1080--1083},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-333},
  doi          = {10.21437/INTERSPEECH.2008-333},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/OhtaniTSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/OkamotoMKSS08,
  author       = {Hideki Okamoto and Tomoko Matsui and Hiromichi Kawanami and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Speaker verification with non-audible murmur segments by combining global alignment kernel and penalized logistic regression machine},
  booktitle    = {{INTERSPEECH} 2008, 9th Annual Conference of the International Speech Communication Association, Brisbane, Australia, September 22-26, 2008},
  pages        = {1369--1372},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-398},
  doi          = {10.21437/INTERSPEECH.2008-398},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/OkamotoMKSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/TaniTOSS08,
  author       = {Daisuke Tani and Tomoki Toda and Yamato Ohtani and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Maximum a posteriori adaptation for many-to-one eigenvoice conversion},
  booktitle    = {{INTERSPEECH} 2008, 9th Annual Conference of the International Speech Communication Association, Brisbane, Australia, September 22-26, 2008},
  pages        = {1461--1463},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-421},
  doi          = {10.21437/INTERSPEECH.2008-421},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/TaniTOSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/NakamuraTNSS08,
  author       = {Keigo Nakamura and Tomoki Toda and Yoshitaka Nakajima and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Evaluation of speaking-aid system with voice conversion for laryngectomees toward its use in practical environments},
  booktitle    = {{INTERSPEECH} 2008, 9th Annual Conference of the International Speech Communication Association, Brisbane, Australia, September 22-26, 2008},
  pages        = {2209--2212},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-577},
  doi          = {10.21437/INTERSPEECH.2008-577},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/NakamuraTNSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/TakahashiSS08,
  author       = {Yu Takahashi and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Real-time implementation of blind spatial subtraction array for hands-free robot spoken dialogue system},
  booktitle    = {2008 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, September 22-26, 2008, Acropolis Convention Center, Nice, France},
  pages        = {1687--1692},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/IROS.2008.4651006},
  doi          = {10.1109/IROS.2008.4651006},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/TakahashiSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/EvenSS08,
  author       = {Jani Even and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {An improved permutation solver for blind signal separation based front-ends in robot audition},
  booktitle    = {2008 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, September 22-26, 2008, Acropolis Convention Center, Nice, France},
  pages        = {2172--2177},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/IROS.2008.4650602},
  doi          = {10.1109/IROS.2008.4650602},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/EvenSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/wocci/MiyakeTKSS08,
  author       = {Jumpei Miyake and Shota Takeuchi and Hiromichi Kawanami and Hiroshi Saruwatari and Kiyohiro Shikano},
  editor       = {Kay Berkling and Diego Giuliani and Alexandros Potamianos},
  title        = {Language model for the web search task in a spoken dialogue system for children},
  booktitle    = {The 1st Workshop on Child, Computer and Interaction, {WOCCI} 2008, Chania, Crete, Greece, October 23, 2008},
  pages        = {10},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {http://www.isca-speech.org/archive/wocci\_2008/woc8\_10.html},
  timestamp    = {Tue, 16 Nov 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/wocci/MiyakeTKSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ejasp/HeracleousKSS07,
  author       = {Panikos Heracleous and Tomomi Kaino and Hiroshi Saruwatari and Kiyohiro Shikano},
  title        = {Unvoiced Speech Recognition Using Tissue-Conductive Acoustic Sensor},
  journal      = {{EURASIP} J. Adv. Signal Process.},
  volume       = {2007},
  year         = {2007},
  url          = {https://doi.org/10.1155/2007/94068},
  doi          = {10.1155/2007/94068},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ejasp/HeracleousKSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ejasp/MiyabeHSST07,
  author       = {Shigeki Miyabe and Yoichi Hinamoto and Hiroshi Saruwatari and Kiyohiro Shikano and Yosuke Tatekura},
  title        = {Interface for Barge-in Free Spoken Dialogue System Based on Sound Field Reproduction and Microphone Array},
  journal      = {{EURASIP} J. Adv. Signal Process.},
  volume       = {2007},
  year         = {2007},
  url          = {https://doi.org/10.1155/2007/57470},
  doi          = {10.1155/2007/57470},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ejasp/MiyabeHSST07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Title: the acronym HMM is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/ieicet/GomezTSS07,
  author       = {Randy Gomez and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Reducing Computation Time of the Rapid Unsupervised Speaker Adaptation
                  Based on {HMM}-Sufficient Statistics},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {90-D},
  number       = {2},
  pages        = {554--561},
  year         = {2007},
  url          = {https://doi.org/10.1093/ietisy/e90-d.2.554},
  doi          = {10.1093/IETISY/E90-D.2.554},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/GomezTSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Title: the abbreviation Q&A is brace-protected as a unit so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/asru/CincarekKSS07,
  author       = {Tobias Cincarek and
                  Hiromichi Kawanami and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Sadaoki Furui and
                  Tatsuya Kawahara},
  title        = {Development and portability of {ASR} and {Q{\&}A} modules for real-environment
                  speech-oriented guidance systems},
  booktitle    = {{IEEE} Workshop on Automatic Speech Recognition {\&} Understanding,
                  {ASRU} 2007, Kyoto, Japan, December 9-13, 2007},
  pages        = {520--525},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ASRU.2007.4430166},
  doi          = {10.1109/ASRU.2007.4430166},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/asru/CincarekKSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/MiyabeTSST07,
  author       = {Shigeki Miyabe and
                  Tomoya Takatani and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Yosuke Tatekura},
  title        = {Barge-in- and noise-free spoken dialogue interface based on sound
                  field control and semi-blind source separation},
  booktitle    = {15th European Signal Processing Conference, {EUSIPCO} 2007, Poznan,
                  Poland, September 3-7, 2007},
  pages        = {232--236},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://ieeexplore.ieee.org/document/7098799/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/MiyabeTSST07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/TachibanaSMMST07,
  author       = {Kentaro Tachibana and
                  Hiroshi Saruwatari and
                  Yoshimitsu Mori and
                  Shigeki Miyabe and
                  Kiyohiro Shikano and
                  Akira Tanaka},
  title        = {Efficient Blind Source Separation Combining Closed-Form Second-Order
                  {ICA} and Nonclosed-Form Higher-Order {ICA}},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2007, Honolulu, Hawaii, USA, April
                  15-20, 2007},
  pages        = {45--48},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ICASSP.2007.366612},
  doi          = {10.1109/ICASSP.2007.366612},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/TachibanaSMMST07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/TakahashiTSS07,
  author       = {Yu Takahashi and
                  Tomoya Takatani and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Permutation-Robust Structure for {ICA}-Based Blind Source Extraction},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2007, Honolulu, Hawaii, USA, April
                  15-20, 2007},
  pages        = {149--152},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ICASSP.2007.366638},
  doi          = {10.1109/ICASSP.2007.366638},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/TakahashiTSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/MoriTSSHM07,
  author       = {Yoshimitsu Mori and
                  Tomoya Takatani and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Takashi Hiekata and
                  Takashi Morita},
  title        = {High-Presence Hearing-Aid System using {DSP}-Based Real-Time Blind Source
                  Separation Module},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2007, Honolulu, Hawaii, USA, April
                  15-20, 2007},
  pages        = {609--612},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ICASSP.2007.366986},
  doi          = {10.1109/ICASSP.2007.366986},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/MoriTSSHM07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/GomezTSS07,
  author       = {Randy Gomez and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Rapid unsupervised speaker adaptation using single utterance based
                  on {MLLR} and speaker selection},
  booktitle    = {{INTERSPEECH} 2007, 8th Annual Conference of the International Speech
                  Communication Association, Antwerp, Belgium, August 27-31, 2007},
  pages        = {262--265},
  publisher    = {{ISCA}},
  year         = {2007},
  url          = {https://doi.org/10.21437/Interspeech.2007-117},
  doi          = {10.21437/INTERSPEECH.2007-117},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/GomezTSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/CincarekSTSS07,
  author       = {Tobias Cincarek and
                  Izumi Shindo and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Development of preschool children subsystem for {ASR} and {Q{\&}A}
                  in a real-environment speech-oriented guidance task},
  booktitle    = {{INTERSPEECH} 2007, 8th Annual Conference of the International Speech
                  Communication Association, Antwerp, Belgium, August 27-31, 2007},
  pages        = {1469--1472},
  publisher    = {{ISCA}},
  year         = {2007},
  url          = {https://doi.org/10.21437/Interspeech.2007-426},
  doi          = {10.21437/INTERSPEECH.2007-426},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/CincarekSTSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/OhtaniTSS07,
  author       = {Yamato Ohtani and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Speaker adaptive training for one-to-many eigenvoice conversion based
                  on {Gaussian} mixture model},
  booktitle    = {{INTERSPEECH} 2007, 8th Annual Conference of the International Speech
                  Communication Association, Antwerp, Belgium, August 27-31, 2007},
  pages        = {1981--1984},
  publisher    = {{ISCA}},
  year         = {2007},
  url          = {https://doi.org/10.21437/Interspeech.2007-554},
  doi          = {10.21437/INTERSPEECH.2007-554},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/OhtaniTSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/OkamotoKMKSS07,
  author       = {Hideki Okamoto and
                  Mariko Kojima and
                  Tomoko Matsui and
                  Hiromichi Kawanami and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Study on speaker verification with non-audible murmur segments},
  booktitle    = {{INTERSPEECH} 2007, 8th Annual Conference of the International Speech
                  Communication Association, Antwerp, Belgium, August 27-31, 2007},
  pages        = {2017--2020},
  publisher    = {{ISCA}},
  year         = {2007},
  url          = {https://doi.org/10.21437/Interspeech.2007-164},
  doi          = {10.21437/INTERSPEECH.2007-164},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/OkamotoKMKSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/NakamuraTSS07,
  author       = {Keigo Nakamura and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Impact of various small sound source signals on voice conversion accuracy
                  in speech communication aid for laryngectomees},
  booktitle    = {{INTERSPEECH} 2007, 8th Annual Conference of the International Speech
                  Communication Association, Antwerp, Belgium, August 27-31, 2007},
  pages        = {2517--2520},
  publisher    = {{ISCA}},
  year         = {2007},
  url          = {https://doi.org/10.21437/Interspeech.2007-669},
  doi          = {10.21437/INTERSPEECH.2007-669},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/NakamuraTSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isspa/MoriTSSHM07,
  author       = {Yoshimitsu Mori and
                  Tomoya Takatani and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Takashi Hiekata and
                  Takashi Morita},
  title        = {Noise-robust hands-free speech recognition using {SIMO}-model-based
                  blind source separation},
  booktitle    = {9th International Symposium on Signal Processing and Its Applications,
                  {ISSPA} 2007, Sharjah, United Arab Emirates, February 12-15, 2007},
  pages        = {1--4},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ISSPA.2007.4555597},
  doi          = {10.1109/ISSPA.2007.4555597},
  timestamp    = {Wed, 16 Oct 2019 14:14:56 +0200},
  biburl       = {https://dblp.org/rec/conf/isspa/MoriTSSHM07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isspa/TakahashiTSS07,
  author       = {Yu Takahashi and
                  Tomoya Takatani and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Robust spatial subtraction array with independent component analysis
                  for speech enhancement},
  booktitle    = {9th International Symposium on Signal Processing and Its Applications,
                  {ISSPA} 2007, Sharjah, United Arab Emirates, February 12-15, 2007},
  pages        = {1--4},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ISSPA.2007.4555589},
  doi          = {10.1109/ISSPA.2007.4555589},
  timestamp    = {Fri, 26 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/isspa/TakahashiTSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocomm/SakaiCKSSL07,
  author       = {Hiroyuki Sakai and
                  Tobias Cincarek and
                  Hiromichi Kawanami and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Akinobu Lee},
  editor       = {Alan F. T. Winfield and
                  Jason Redi},
  title        = {Voice activity detection applied to hands-free spoken dialogue robot
                  based on decoding using acoustic and language model},
  booktitle    = {Proceedings of the 1st International Conference on Robot Communication
                  and Coordination, {ROBOCOMM} 2007, Athens, Greece, October 15-17,
                  2007},
  series       = {{ACM} International Conference Proceeding Series},
  volume       = {318},
  pages        = {16},
  publisher    = {{ICST/ACM}},
  year         = {2007},
  url          = {https://doi.org/10.4108/ICST.ROBOCOMM2007.2088},
  doi          = {10.4108/ICST.ROBOCOMM2007.2088},
  timestamp    = {Tue, 27 Nov 2018 10:40:37 +0100},
  biburl       = {https://dblp.org/rec/conf/robocomm/SakaiCKSSL07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ssw/OhtaOTSS07,
  author       = {Kumi Ohta and
                  Yamato Ohtani and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Petra Wagner and
                  Julia Abresch and
                  Stefan Breuer and
                  Wolfgang Hess},
  title        = {Regression approaches to voice quality control based on one-to-many
                  eigenvoice conversion},
  booktitle    = {Sixth {ISCA} Workshop on Speech Synthesis, Bonn, Germany, August 22-24,
                  2007},
  pages        = {101--106},
  publisher    = {{ISCA}},
  year         = {2007},
  url          = {http://www.isca-speech.org/archive\_open/ssw6/ssw6\_101.html},
  timestamp    = {Mon, 04 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ssw/OhtaOTSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ssw/TaniOTSS07,
  author       = {Daisuke Tani and
                  Yamato Ohtani and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Petra Wagner and
                  Julia Abresch and
                  Stefan Breuer and
                  Wolfgang Hess},
  title        = {An evaluation of many-to-one voice conversion algorithms with pre-stored
                  speaker data sets},
  booktitle    = {Sixth {ISCA} Workshop on Speech Synthesis, Bonn, Germany, August 22-24,
                  2007},
  pages        = {107--112},
  publisher    = {{ISCA}},
  year         = {2007},
  url          = {http://www.isca-speech.org/archive\_open/ssw6/ssw6\_107.html},
  timestamp    = {Mon, 04 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ssw/TaniOTSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:books/sp/07/SaruwatariTS07,
  author       = {Hiroshi Saruwatari and
                  Tomoya Takatani and
                  Kiyohiro Shikano},
  editor       = {Shoji Makino and
                  Hiroshi Sawada and
                  Te{-}Won Lee},
  title        = {{SIMO}-Model-Based Blind Source Separation - Principle and its Applications},
  booktitle    = {Blind Speech Separation},
  series       = {Signals and Communication Technology},
  pages        = {149--168},
  publisher    = {Springer},
  year         = {2007},
  url          = {https://doi.org/10.1007/978-1-4020-6479-1\_5},
  doi          = {10.1007/978-1-4020-6479-1\_5},
  timestamp    = {Fri, 12 Jul 2019 10:51:30 +0200},
  biburl       = {https://dblp.org/rec/books/sp/07/SaruwatariTS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ejasp/MoriSTUSHIHM06,
  author       = {Yoshimitsu Mori and
                  Hiroshi Saruwatari and
                  Tomoya Takatani and
                  Satoshi Ukai and
                  Kiyohiro Shikano and
                  Takashi Hiekata and
                  Youhei Ikeda and
                  Hiroshi Hashimoto and
                  Takashi Morita},
  title        = {Blind Separation of Acoustic Signals Combining {SIMO}-Model-Based Independent
                  Component Analysis and Binary Masking},
  journal      = {{EURASIP} J. Adv. Signal Process.},
  volume       = {2006},
  year         = {2006},
  url          = {https://doi.org/10.1155/ASP/2006/34970},
  doi          = {10.1155/ASP/2006/34970},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ejasp/MoriSTUSHIHM06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/MiyabeSST06,
  author       = {Shigeki Miyabe and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Yosuke Tatekura},
  title        = {Interface for Barge-in Free Spoken Dialogue System Using Nullspace
                  Based Sound Field Control and Beamforming},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {89-A},
  number       = {3},
  pages        = {716--726},
  year         = {2006},
  url          = {https://doi.org/10.1093/ietfec/e89-a.3.716},
  doi          = {10.1093/IETFEC/E89-A.3.716},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/MiyabeSST06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/CincarekTSS06,
  author       = {Tobias Cincarek and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Utterance-Based Selective Training for the Automatic Creation of Task-Dependent
                  Acoustic Models},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {89-D},
  number       = {3},
  pages        = {962--969},
  year         = {2006},
  url          = {https://doi.org/10.1093/ietisy/e89-d.3.962},
  doi          = {10.1093/IETISY/E89-D.3.962},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/CincarekTSS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/GomezLTSS06,
  author       = {Randy Gomez and
                  Akinobu Lee and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Improving Rapid Unsupervised Speaker Adaptation Based on {HMM}-Sufficient
                  Statistics in Noisy Environments Using Multi-Template Models},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {89-D},
  number       = {3},
  pages        = {998--1005},
  year         = {2006},
  url          = {https://doi.org/10.1093/ietisy/e89-d.3.998},
  doi          = {10.1093/IETISY/E89-D.3.998},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/GomezLTSS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/SaruwatariKNLS06,
  author       = {Hiroshi Saruwatari and
                  Toshiya Kawamura and
                  Tsuyoki Nishikawa and
                  Akinobu Lee and
                  Kiyohiro Shikano},
  title        = {Blind source separation based on a fast-convergence algorithm combining
                  {ICA} and beamforming},
  journal      = {{IEEE} Trans. Speech Audio Process.},
  volume       = {14},
  number       = {2},
  pages        = {666--678},
  year         = {2006},
  url          = {https://doi.org/10.1109/TSA.2005.855832},
  doi          = {10.1109/TSA.2005.855832},
  timestamp    = {Sun, 17 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/SaruwatariKNLS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/MoriTSSHM06,
  author       = {Yoshimitsu Mori and
                  Tomoya Takatani and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Takashi Hiekata and
                  Takashi Morita},
  title        = {Two-stage blind separation of moving sound sources with pocket-size
                  real-time {DSP} module},
  booktitle    = {14th European Signal Processing Conference, {EUSIPCO} 2006, Florence,
                  Italy, September 4-8, 2006},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://ieeexplore.ieee.org/document/7071689/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/MoriTSSHM06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ica/MoriSTSHM06,
  author       = {Yoshimitsu Mori and
                  Hiroshi Saruwatari and
                  Tomoya Takatani and
                  Kiyohiro Shikano and
                  Takashi Hiekata and
                  Takashi Morita},
  editor       = {Justinian P. Rosca and
                  Deniz Erdogmus and
                  Jos{\'{e}} Carlos Pr{\'{\i}}ncipe and
                  Simon Haykin},
  title        = {{ICA} and Binary-Mask-Based Blind Source Separation with Small Directional
                  Microphones},
  booktitle    = {Independent Component Analysis and Blind Signal Separation, 6th International
                  Conference, {ICA} 2006, Charleston, SC, USA, March 5-8, 2006, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {3889},
  pages        = {649--657},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/11679363\_81},
  doi          = {10.1007/11679363\_81},
  timestamp    = {Wed, 03 Mar 2021 09:19:59 +0100},
  biburl       = {https://dblp.org/rec/conf/ica/MoriSTSHM06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/MoriTSHM06,
  author       = {Yoshimitsu Mori and
                  Tomoya Takatani and
                  Hiroshi Saruwatari and
                  Takashi Hiekata and
                  Takashi Morita},
  title        = {Blind Source Separation Combining {SIMO-ICA} and {SIMO}-Model-Based Binary
                  Masking},
  booktitle    = {2006 {IEEE} International Conference on Acoustics Speech and Signal
                  Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages        = {81--84},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/ICASSP.2006.1661217},
  doi          = {10.1109/ICASSP.2006.1661217},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/MoriTSHM06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/MiyabeTMSST06,
  author       = {Shigeki Miyabe and
                  Tomoya Takatani and
                  Yoshimitsu Mori and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Yosuke Tatekura},
  title        = {Double-Talk Free Spoken Dialogue Interface Combining Sound Field Control
                  With Semi-Blind Source Separation},
  booktitle    = {2006 {IEEE} International Conference on Acoustics Speech and Signal
                  Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages        = {809--812},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/ICASSP.2006.1660144},
  doi          = {10.1109/ICASSP.2006.1660144},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/MiyabeTMSST06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/GomezTSS06,
  author       = {Randy Gomez and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Improving Rapid Unsupervised Speaker Adaptation Based On {HMM} Sufficient
                  Statistics},
  booktitle    = {2006 {IEEE} International Conference on Acoustics Speech and Signal
                  Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages        = {1001--1004},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/ICASSP.2006.1660192},
  doi          = {10.1109/ICASSP.2006.1660192},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/GomezTSS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/CincarekTSS06,
  author       = {Tobias Cincarek and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Acoustic modeling for spoken dialogue systems based on unsupervised
                  utterance-based selective training},
  booktitle    = {{INTERSPEECH} 2006 - ICSLP, Ninth International Conference on Spoken
                  Language Processing, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher    = {{ISCA}},
  year         = {2006},
  url          = {https://doi.org/10.21437/Interspeech.2006-478},
  doi          = {10.21437/INTERSPEECH.2006-478},
  timestamp    = {Thu, 22 Jun 2023 16:42:16 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/CincarekTSS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/KojimaMKSS06,
  author       = {Mariko Kojima and
                  Tomoko Matsui and
                  Hiromichi Kawanami and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Speaker verification with non-audible murmur segments},
  booktitle    = {{INTERSPEECH} 2006 - ICSLP, Ninth International Conference on Spoken
                  Language Processing, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher    = {{ISCA}},
  year         = {2006},
  url          = {https://doi.org/10.21437/Interspeech.2006-194},
  doi          = {10.21437/INTERSPEECH.2006-194},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/KojimaMKSS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/NakamuraTSS06,
  author       = {Keigo Nakamura and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Speaking aid system for total laryngectomees using voice conversion
                  of body transmitted artificial speech},
  booktitle    = {{INTERSPEECH} 2006 - ICSLP, Ninth International Conference on Spoken
                  Language Processing, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher    = {{ISCA}},
  year         = {2006},
  url          = {https://doi.org/10.21437/Interspeech.2006-419},
  doi          = {10.21437/INTERSPEECH.2006-419},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/NakamuraTSS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/OhtaniTSS06,
  author       = {Yamato Ohtani and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Maximum likelihood voice conversion based on {GMM} with {STRAIGHT}
                  mixed excitation},
  booktitle    = {{INTERSPEECH} 2006 - ICSLP, Ninth International Conference on Spoken
                  Language Processing, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher    = {{ISCA}},
  year         = {2006},
  url          = {https://doi.org/10.21437/Interspeech.2006-582},
  doi          = {10.21437/INTERSPEECH.2006-582},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/OhtaniTSS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lrec/KatoTSS06,
  author       = {Tomoyuki Kato and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Nicoletta Calzolari and
                  Khalid Choukri and
                  Aldo Gangemi and
                  Bente Maegaard and
                  Joseph Mariani and
                  Jan Odijk and
                  Daniel Tapias},
  title        = {Transcription Cost Reduction for Constructing Acoustic Models Using
                  Acoustic Likelihood Selection Criteria},
  booktitle    = {Proceedings of the Fifth International Conference on Language Resources
                  and Evaluation, {LREC} 2006, Genoa, Italy, May 22-28, 2006},
  pages        = {789--792},
  publisher    = {European Language Resources Association {(ELRA)}},
  year         = {2006},
  url          = {http://www.lrec-conf.org/proceedings/lrec2006/summaries/344.html},
  timestamp    = {Mon, 19 Aug 2019 15:23:22 +0200},
  biburl       = {https://dblp.org/rec/conf/lrec/KatoTSS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/AdachiTKSS05,
  author       = {Kazuki Adachi and
                  Tomoki Toda and
                  Hiromichi Kawanami and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Designing Target Cost Function Based on Prosody of Speech Database},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {88-D},
  number       = {3},
  pages        = {519--524},
  year         = {2005},
  url          = {http://search.ieice.org/bin/summary.php?id=e88-d\_3\_519\&category=D\&year=2005\&lang=E\&abst=},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/AdachiTKSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/UkaiTSSMS05,
  author       = {Satoshi Ukai and
                  Tomoya Takatani and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Ryo Mukai and
                  Hiroshi Sawada},
  title        = {Multistage {SIMO}-Model-Based Blind Source Separation Combining Frequency-Domain
                  {ICA} and Time-Domain {ICA}},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {88-A},
  number       = {3},
  pages        = {642--650},
  year         = {2005},
  url          = {https://doi.org/10.1093/ietfec/e88-a.3.642},
  doi          = {10.1093/IETFEC/E88-A.3.642},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/UkaiTSSMS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/AsaiSS05,
  author       = {Tatsunori Asai and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Interface for Barge-in Free Spoken Dialogue System Combining Adaptive
                  Sound Field Control and Microphone Array},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {88-A},
  number       = {6},
  pages        = {1613--1618},
  year         = {2005},
  url          = {https://doi.org/10.1093/ietfec/e88-a.6.1613},
  doi          = {10.1093/IETFEC/E88-A.6.1613},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/AsaiSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/TakataniUNSS05,
  author       = {Tomoya Takatani and
                  Satoshi Ukai and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {A Self-Generator Method for Initial Filters of {SIMO-ICA} Applied
                  to Blind Separation of Binaural Sound Mixtures},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {88-A},
  number       = {7},
  pages        = {1673--1682},
  year         = {2005},
  url          = {https://doi.org/10.1093/ietfec/e88-a.7.1673},
  doi          = {10.1093/IETFEC/E88-A.7.1673},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/TakataniUNSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/PrasadSS05,
  author       = {Rajkishore Prasad and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Blind Separation of Speech by Fixed-Point {ICA} with Source Adaptive
                  Negentropy Approximation},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {88-A},
  number       = {7},
  pages        = {1683--1692},
  year         = {2005},
  url          = {https://doi.org/10.1093/ietfec/e88-a.7.1683},
  doi          = {10.1093/IETFEC/E88-A.7.1683},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/PrasadSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/TatekuraUSS05,
  author       = {Yosuke Tatekura and
                  Shigefumi Urata and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {On-Line Relaxation Algorithm Applicable to Acoustic Fluctuation for
                  Inverse Filter in Multichannel Sound Reproduction System},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {88-A},
  number       = {7},
  pages        = {1747--1756},
  year         = {2005},
  url          = {https://doi.org/10.1093/ietfec/e88-a.7.1747},
  doi          = {10.1093/IETFEC/E88-A.7.1747},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/TatekuraUSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/SaruwatariYTNS05,
  author       = {Hiroshi Saruwatari and
                  Hiroaki Yamajo and
                  Tomoya Takatani and
                  Tsuyoki Nishikawa and
                  Kiyohiro Shikano},
  title        = {Blind Separation and Deconvolution for Convolutive Mixture of Speech
                  Combining {SIMO}-Model-Based {ICA} and Multichannel Inverse Filtering},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {88-A},
  number       = {9},
  pages        = {2387--2400},
  year         = {2005},
  url          = {https://doi.org/10.1093/ietfec/e88-a.9.2387},
  doi          = {10.1093/IETFEC/E88-A.9.2387},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/SaruwatariYTNS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieicet/ArakiMANS05,
  author       = {Shoko Araki and
                  Shoji Makino and
                  Robert Aichner and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari},
  title        = {Subband-Based Blind Separation for Convolutive Mixtures of Speech},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {88-A},
  number       = {12},
  pages        = {3593--3603},
  year         = {2005},
  url          = {https://doi.org/10.1093/ietfec/e88-a.12.3593},
  doi          = {10.1093/IETFEC/E88-A.12.3593},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ieicet/ArakiMANS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/npl/PrasadSS05,
  author       = {Rajkishore Prasad and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Estimation of Shape Parameter of {GGD} Function by Negentropy Matching},
  journal      = {Neural Process. Lett.},
  volume       = {22},
  number       = {3},
  pages        = {377--389},
  year         = {2005},
  url          = {https://doi.org/10.1007/s11063-005-1385-9},
  doi          = {10.1007/S11063-005-1385-9},
  timestamp    = {Thu, 09 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/npl/PrasadSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusai/HeracleousNSS05,
  author       = {Panikos Heracleous and
                  Yoshitaka Nakajima and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {G{\'{e}}rard Bailly and
                  James L. Crowley},
  title        = {A tissue-conductive acoustic sensor applied in speech recognition
                  for privacy},
  booktitle    = {Proceedings of the 2005 joint conference on Smart objects and ambient
                  intelligence - innovative context-aware services: usages and technologies,
                  sOc-EUSAI '05, Grenoble, France, October 12-14, 2005},
  pages        = {93--97},
  publisher    = {{ACM}},
  year         = {2005},
  url          = {https://doi.org/10.1145/1107548.1107577},
  doi          = {10.1145/1107548.1107577},
  timestamp    = {Fri, 28 Jan 2022 11:34:47 +0100},
  biburl       = {https://dblp.org/rec/conf/eusai/HeracleousNSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/MiyabeSST05,
  author       = {Shigeki Miyabe and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Yosuke Tatekura},
  title        = {Barge-in free spoken dialogue interface using nullspace-based sound
                  field control and beamforming},
  booktitle    = {13th European Signal Processing Conference, {EUSIPCO} 2005, Antalya,
                  Turkey, September 4-8, 2005},
  pages        = {1--4},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://ieeexplore.ieee.org/document/7078179/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/MiyabeSST05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/NishikawaSS05,
  author       = {Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Blind separation of more than two sources based on high-convergence
                  algorithm combining {ICA} and beamforming},
  booktitle    = {13th European Signal Processing Conference, {EUSIPCO} 2005, Antalya,
                  Turkey, September 4-8, 2005},
  pages        = {1--4},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://ieeexplore.ieee.org/document/7078209/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/NishikawaSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/SaruwatariUTNS05,
  author       = {Hiroshi Saruwatari and
                  Satoshi Ukai and
                  Tomoya Takatani and
                  Tsuyoki Nishikawa and
                  Kiyohiro Shikano},
  title        = {Two-stage blind source separation combining {SIMO}-model-based {ICA}
                  and adaptive beamforming},
  booktitle    = {13th European Signal Processing Conference, {EUSIPCO} 2005, Antalya,
                  Turkey, September 4-8, 2005},
  pages        = {1--4},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://ieeexplore.ieee.org/document/7078226/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/SaruwatariUTNS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/TakataniUNSS05,
  author       = {Tomoya Takatani and
                  Satoshi Ukai and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Blind separation of binaural sound mixtures using {SIMO-ICA} with
                  self-generator for initial filter},
  booktitle    = {13th European Signal Processing Conference, {EUSIPCO} 2005, Antalya,
                  Turkey, September 4-8, 2005},
  pages        = {1--4},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://ieeexplore.ieee.org/document/7078282/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/TakataniUNSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/UkaiTNS05,
  author       = {Satoshi Ukai and
                  Tomoya Takatani and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari},
  title        = {Blind source separation combining {SIMO}-model-based {ICA} and adaptive
                  beamforming},
  booktitle    = {2005 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} '05, Philadelphia, Pennsylvania, USA, March 18-23,
                  2005},
  pages        = {85--88},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://doi.org/10.1109/ICASSP.2005.1415652},
  doi          = {10.1109/ICASSP.2005.1415652},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/UkaiTNS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icde/SaruwatariSNLSKSS05,
  author       = {Hiroshi Saruwatari and
                  Katsuyuki Sawai and
                  Tsuyoki Nishikawa and
                  Akinobu Lee and
                  Kiyohiro Shikano and
                  Atsunobu Kaminuma and
                  Masao Sakata and
                  Daisuke Saitoh},
  title        = {Speech Enhancement Based on Blind Source Separation in Car Environments},
  booktitle    = {Proceedings of the 21st International Conference on Data Engineering
                  Workshops, {ICDE} 2005, 5-8 April 2005, Tokyo, Japan},
  pages        = {1205},
  publisher    = {{IEEE} Computer Society},
  year         = {2005},
  url          = {https://doi.org/10.1109/ICDE.2005.289},
  doi          = {10.1109/ICDE.2005.289},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icde/SaruwatariSNLSKSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/GomezLSS05,
  author       = {Randy Gomez and
                  Akinobu Lee and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Rapid unsupervised speaker adaptation based on multi-template {HMM}
                  sufficient statistics in noisy environments},
  booktitle    = {{INTERSPEECH} 2005 - Eurospeech, 9th European Conference on Speech
                  Communication and Technology, Lisbon, Portugal, September 4-8, 2005},
  pages        = {293--296},
  publisher    = {{ISCA}},
  year         = {2005},
  url          = {https://doi.org/10.21437/Interspeech.2005-161},
  doi          = {10.21437/INTERSPEECH.2005-161},
  timestamp    = {Thu, 22 Jun 2023 16:42:16 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/GomezLSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaitohKSNL05,
  author       = {Daisuke Saitoh and
                  Atsunobu Kaminuma and
                  Hiroshi Saruwatari and
                  Tsuyoki Nishikawa and
                  Akinobu Lee},
  title        = {Speech extraction in a car interior using frequency-domain {ICA} with
                  rapid filter adaptations},
  booktitle    = {{INTERSPEECH} 2005 - Eurospeech, 9th European Conference on Speech
                  Communication and Technology, Lisbon, Portugal, September 4-8, 2005},
  pages        = {2301--2304},
  publisher    = {{ISCA}},
  year         = {2005},
  url          = {https://doi.org/10.21437/Interspeech.2005-736},
  doi          = {10.21437/INTERSPEECH.2005-736},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SaitohKSNL05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/HeracleousKSS05,
  author       = {Panikos Heracleous and
                  Tomomi Kaino and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Investigating the role of the {Lombard} reflex in non-audible murmur
                  {(NAM)} recognition},
  booktitle    = {{INTERSPEECH} 2005 - Eurospeech, 9th European Conference on Speech
                  Communication and Technology, Lisbon, Portugal, September 4-8, 2005},
  pages        = {2649--2652},
  publisher    = {{ISCA}},
  year         = {2005},
  url          = {https://doi.org/10.21437/Interspeech.2005-251},
  doi          = {10.21437/INTERSPEECH.2005-251},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HeracleousKSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/HeracleousKSS05a,
  author       = {Panikos Heracleous and
                  Tomomi Kaino and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Applications of {NAM} microphones in speech recognition for privacy
                  in human-machine communication},
  booktitle    = {{INTERSPEECH} 2005 - Eurospeech, 9th European Conference on Speech
                  Communication and Technology, Lisbon, Portugal, September 4-8, 2005},
  pages        = {3041--3044},
  publisher    = {{ISCA}},
  year         = {2005},
  url          = {https://doi.org/10.21437/Interspeech.2005-149},
  doi          = {10.21437/INTERSPEECH.2005-149},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HeracleousKSS05a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/TakataniUNSS05,
  author       = {Tomoya Takatani and
                  Satoshi Ukai and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Blind sound scene decomposition for robot audition using {SIMO}-model-based
                  {ICA}},
  booktitle    = {2005 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, Edmonton, Alberta, Canada, August 2-6, 2005},
  pages        = {2247--2252},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://doi.org/10.1109/IROS.2005.1544984},
  doi          = {10.1109/IROS.2005.1544984},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/TakataniUNSS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/SaruwatariMTUSHM05,
  author       = {Hiroshi Saruwatari and
                  Yoshimitsu Mori and
                  Tomoya Takatani and
                  Satoshi Ukai and
                  Kiyohiro Shikano and
                  Takashi Hiekata and
                  Takashi Morita},
  title        = {Two-stage blind source separation based on {ICA} and binary masking
                  for real-time robot audition system},
  booktitle    = {2005 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, Edmonton, Alberta, Canada, August 2-6, 2005},
  pages        = {2303--2308},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://doi.org/10.1109/IROS.2005.1544983},
  doi          = {10.1109/IROS.2005.1544983},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/SaruwatariMTUSHM05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/OhashiNSLS05,
  author       = {Yasuaki Ohashi and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Akinobu Lee and
                  Kiyohiro Shikano},
  title        = {Noise-robust hands-free speech recognition based on spatial subtraction
                  array and known noise superimposition},
  booktitle    = {2005 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, Edmonton, Alberta, Canada, August 2-6, 2005},
  pages        = {2328--2332},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://doi.org/10.1109/IROS.2005.1545036},
  doi          = {10.1109/IROS.2005.1545036},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/OhashiNSLS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ar/PrasadSS04,
  author       = {Rajkishore Prasad and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Robots that can hear, understand and talk},
  journal      = {Adv. Robotics},
  volume       = {18},
  number       = {5},
  pages        = {533--564},
  year         = {2004},
  url          = {https://doi.org/10.1163/156855304774195064},
  doi          = {10.1163/156855304774195064},
  timestamp    = {Sat, 30 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ar/PrasadSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieiceee/PrasadSS04,
  author       = {Rajkishore Prasad and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Negentropy based voice-activity detection for noise estimation in
                  very low {SNR} condition},
  journal      = {{IEICE} Electron. Express},
  volume       = {1},
  number       = {16},
  pages        = {495--500},
  year         = {2004},
  url          = {https://doi.org/10.1587/elex.1.495},
  doi          = {10.1587/ELEX.1.495},
  timestamp    = {Fri, 10 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieiceee/PrasadSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/HeracleousNLSS04,
  author       = {Panikos Heracleous and
                  Yoshitaka Nakajima and
                  Akinobu Lee and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Audible (normal) speech and inaudible murmur recognition using {NAM}
                  microphone},
  booktitle    = {2004 12th European Signal Processing Conference, Vienna, Austria,
                  September 6-10, 2004},
  pages        = {329--332},
  publisher    = {{IEEE}},
  year         = {2004},
  url          = {https://ieeexplore.ieee.org/document/7079711/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/HeracleousNLSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/YamajoSTNS04,
  author       = {Hiroaki Yamajo and
                  Hiroshi Saruwatari and
                  Tomoya Takatani and
                  Tsuyoki Nishikawa and
                  Kiyohiro Shikano},
  title        = {Evaluation of blind separation and deconvolution for binaural-sound
                  mixtures using {SIMO}-model-based {ICA}},
  booktitle    = {2004 12th European Signal Processing Conference, Vienna, Austria,
                  September 6-10, 2004},
  pages        = {1709--1712},
  publisher    = {{IEEE}},
  year         = {2004},
  url          = {https://ieeexplore.ieee.org/document/7080136/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/YamajoSTNS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/TatekuraUSS04,
  author       = {Yosuke Tatekura and
                  Shigefumi Urata and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {On-line adaptive algorithm to acoustic fluctuation for inverse filter
                  relaxation in sound reproduction system},
  booktitle    = {2004 12th European Signal Processing Conference, Vienna, Austria,
                  September 6-10, 2004},
  pages        = {1765--1768},
  publisher    = {{IEEE}},
  year         = {2004},
  url          = {https://ieeexplore.ieee.org/document/7079842/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/TatekuraUSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ica/UkaiSTSMS04,
  author       = {Satoshi Ukai and
                  Hiroshi Saruwatari and
                  Tomoya Takatani and
                  Kiyohiro Shikano and
                  Ryo Mukai and
                  Hiroshi Sawada},
  editor       = {Carlos Garc{\'{\i}}a Puntonet and
                  Alberto Prieto},
  title        = {Evaluation of Multistage {SIMO}-Model-Based Blind Source Separation
                  Combining Frequency-Domain {ICA} and Time-Domain {ICA}},
  booktitle    = {Independent Component Analysis and Blind Signal Separation, Fifth
                  International Conference, {ICA} 2004, Granada, Spain, September 22-24,
                  2004, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {3195},
  pages        = {626--633},
  publisher    = {Springer},
  year         = {2004},
  url          = {https://doi.org/10.1007/978-3-540-30110-3\_80},
  doi          = {10.1007/978-3-540-30110-3\_80},
  timestamp    = {Tue, 14 May 2019 10:00:52 +0200},
  biburl       = {https://dblp.org/rec/conf/ica/UkaiSTSMS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ica/PrasadSS04,
  author       = {Rajkishore Prasad and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Carlos Garc{\'{\i}}a Puntonet and
                  Alberto Prieto},
  title        = {Single Channel Speech Enhancement: {MAP} Estimation Using {GGD} Prior
                  Under Blind Setup},
  booktitle    = {Independent Component Analysis and Blind Signal Separation, Fifth
                  International Conference, {ICA} 2004, Granada, Spain, September 22-24,
                  2004, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {3195},
  pages        = {873--880},
  publisher    = {Springer},
  year         = {2004},
  url          = {https://doi.org/10.1007/978-3-540-30110-3\_110},
  doi          = {10.1007/978-3-540-30110-3\_110},
  timestamp    = {Wed, 24 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ica/PrasadSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ica/NishikawaSSK04,
  author       = {Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Atsunobu Kaminuma},
  editor       = {Carlos Garc{\'{\i}}a Puntonet and
                  Alberto Prieto},
  title        = {Stable and Low-Distortion Algorithm Based on Overdetermined Blind
                  Separation for Convolutive Mixtures of Speech},
  booktitle    = {Independent Component Analysis and Blind Signal Separation, Fifth
                  International Conference, {ICA} 2004, Granada, Spain, September 22-24,
                  2004, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {3195},
  pages        = {881--888},
  publisher    = {Springer},
  year         = {2004},
  url          = {https://doi.org/10.1007/978-3-540-30110-3\_111},
  doi          = {10.1007/978-3-540-30110-3\_111},
  timestamp    = {Wed, 24 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ica/NishikawaSSK04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/UkaiSTMS04,
  author       = {Satoshi Ukai and
                  Hiroshi Saruwatari and
                  Tomoya Takatani and
                  Ryo Mukai and
                  Hiroshi Sawada},
  title        = {Multistage {SIMO}-model-based blind source separation combining frequency-domain
                  {ICA} and time-domain {ICA}},
  booktitle    = {2004 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} 2004, Montreal, Quebec, Canada, May 17-21, 2004},
  pages        = {109--112},
  publisher    = {{IEEE}},
  year         = {2004},
  url          = {https://doi.org/10.1109/ICASSP.2004.1326775},
  doi          = {10.1109/ICASSP.2004.1326775},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/UkaiSTMS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/TakataniNSS04,
  author       = {Tomoya Takatani and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Blind separation of binaural sound mixtures using {SIMO}-model-based
                  independent component analysis},
  booktitle    = {2004 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} 2004, Montreal, Quebec, Canada, May 17-21, 2004},
  pages        = {113--116},
  publisher    = {{IEEE}},
  year         = {2004},
  url          = {https://doi.org/10.1109/ICASSP.2004.1326776},
  doi          = {10.1109/ICASSP.2004.1326776},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/TakataniNSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/NishikawaASS04,
  author       = {Tsuyoki Nishikawa and
                  Hiroshi Abe and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Overdetermined blind separation for convolutive mixtures of speech
                  based on multistage {ICA} using subarray processing},
  booktitle    = {2004 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} 2004, Montreal, Quebec, Canada, May 17-21, 2004},
  pages        = {225--228},
  publisher    = {{IEEE}},
  year         = {2004},
  url          = {https://doi.org/10.1109/ICASSP.2004.1325963},
  doi          = {10.1109/ICASSP.2004.1325963},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/NishikawaASS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/NisimuraLSS04,
  author       = {Ryuichi Nisimura and
                  Akinobu Lee and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Public speech-oriented guidance system with adult and child discrimination
                  capability},
  booktitle    = {2004 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} 2004, Montreal, Quebec, Canada, May 17-21, 2004},
  pages        = {433--436},
  publisher    = {{IEEE}},
  year         = {2004},
  url          = {https://doi.org/10.1109/ICASSP.2004.1326015},
  doi          = {10.1109/ICASSP.2004.1326015},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/NisimuraLSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/PrasadSS04,
  author       = {Rajkishore Prasad and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {{MAP} estimation of speech spectral component under {GGD} a priori},
  booktitle    = {{ISCA} Tutorial and Research Workshop on Statistical and Perceptual
                  Audio Processing, ICC, Jeju, Korea, October 3, 2004},
  pages        = {115},
  publisher    = {{ISCA}},
  year         = {2004},
  url          = {https://www.isca-speech.org/archive\_open/sapa\_04/sap4\_115.html},
  timestamp    = {Tue, 11 Jul 2023 11:45:03 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/PrasadSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/LeeNNSS04,
  author       = {Akinobu Lee and
                  Keisuke Nakamura and
                  Ryuichi Nisimura and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Noise robust real world spoken dialogue system using {GMM} based rejection
                  of unintended inputs},
  booktitle    = {{INTERSPEECH} 2004 - ICSLP, 8th International Conference on Spoken
                  Language Processing, Jeju Island, Korea, October 4-8, 2004},
  pages        = {173--176},
  publisher    = {{ISCA}},
  year         = {2004},
  url          = {https://doi.org/10.21437/Interspeech.2004-111},
  doi          = {10.21437/INTERSPEECH.2004-111},
  timestamp    = {Thu, 22 Jun 2023 16:42:17 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/LeeNNSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/HeracleousNLSS04,
  author       = {Panikos Heracleous and
                  Yoshitaka Nakajima and
                  Akinobu Lee and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Non-audible murmur {(NAM)} speech recognition using a stethoscopic
                  {NAM} microphone},
  booktitle    = {{INTERSPEECH} 2004 - ICSLP, 8th International Conference on Spoken
                  Language Processing, Jeju Island, Korea, October 4-8, 2004},
  pages        = {1469--1472},
  publisher    = {{ISCA}},
  year         = {2004},
  url          = {https://doi.org/10.21437/Interspeech.2004-559},
  doi          = {10.21437/INTERSPEECH.2004-559},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HeracleousNLSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/GomezLSS04,
  author       = {Randy Gomez and
                  Akinobu Lee and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Robust speech recognition with spectral subtraction in low {SNR}},
  booktitle    = {{INTERSPEECH} 2004 - ICSLP, 8th International Conference on Spoken
                  Language Processing, Jeju Island, Korea, October 4-8, 2004},
  pages        = {2077--2080},
  publisher    = {{ISCA}},
  year         = {2004},
  url          = {https://doi.org/10.21437/Interspeech.2004-633},
  doi          = {10.21437/INTERSPEECH.2004-633},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/GomezLSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/AsaiMSS04,
  author       = {Tatsunori Asai and
                  Shigeki Miyabe and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Interface for barge-in free spoken dialogue system using adaptive
                  sound field control},
  booktitle    = {{INTERSPEECH} 2004 - ICSLP, 8th International Conference on Spoken
                  Language Processing, Jeju Island, Korea, October 4-8, 2004},
  pages        = {2665--2668},
  publisher    = {{ISCA}},
  year         = {2004},
  url          = {https://doi.org/10.21437/Interspeech.2004-708},
  doi          = {10.21437/INTERSPEECH.2004-708},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/AsaiMSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lrec/AdachiTKSS04,
  author       = {Kazuki Adachi and
                  Tomoki Toda and
                  Hiromichi Kawanami and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Perceptual Evaluation of Quality Deterioration Owing to Prosody Modification},
  booktitle    = {Proceedings of the Fourth International Conference on Language Resources
                  and Evaluation, {LREC} 2004, May 26-28, 2004, Lisbon, Portugal},
  publisher    = {European Language Resources Association},
  year         = {2004},
  url          = {http://www.lrec-conf.org/proceedings/lrec2004/summaries/681.htm},
  timestamp    = {Mon, 19 Aug 2019 15:22:43 +0200},
  biburl       = {https://dblp.org/rec/conf/lrec/AdachiTKSS04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ejasp/SaruwatariKTINS03,
  author       = {Hiroshi Saruwatari and
                  Satoshi Kurita and
                  Kazuya Takeda and
                  Fumitada Itakura and
                  Tsuyoki Nishikawa and
                  Kiyohiro Shikano},
  title        = {Blind Source Separation Combining Independent Component Analysis and
                  Beamforming},
  journal      = {{EURASIP} J. Adv. Signal Process.},
  volume       = {2003},
  number       = {11},
  pages        = {1135--1146},
  year         = {2003},
  url          = {https://doi.org/10.1155/S1110865703305104},
  doi          = {10.1155/S1110865703305104},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ejasp/SaruwatariKTINS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ejasp/ArakiMHMNS03,
  author       = {Shoko Araki and
                  Shoji Makino and
                  Yoichi Hinamoto and
                  Ryo Mukai and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari},
  title        = {Equivalence between Frequency-Domain Blind Source Separation and Frequency-Domain
                  Adaptive Beamforming for Convolutive Mixtures},
  journal      = {{EURASIP} J. Adv. Signal Process.},
  volume       = {2003},
  number       = {11},
  pages        = {1157--1166},
  year         = {2003},
  url          = {https://doi.org/10.1155/S1110865703305074},
  doi          = {10.1155/S1110865703305074},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ejasp/ArakiMHMNS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieiceta/SaruwatariKNS03,
  author       = {Hiroshi Saruwatari and
                  Toshiya Kawamura and
                  Tsuyoki Nishikawa and
                  Kiyohiro Shikano},
  title        = {Fast-Convergence Algorithm for Blind Source Separation Based on Array
                  Signal Processing},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {86-A},
  number       = {3},
  pages        = {634--639},
  year         = {2003},
  url          = {http://search.ieice.org/bin/summary.php?id=e86-a\_3\_634},
  timestamp    = {Tue, 08 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieiceta/SaruwatariKNS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieiceta/NishikawaSS03,
  author       = {Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Blind Source Separation of Acoustic Signals Based on Multistage {ICA}
                  Combining Frequency-Domain {ICA} and Time-Domain {ICA}},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {86-A},
  number       = {4},
  pages        = {846--858},
  year         = {2003},
  url          = {http://search.ieice.org/bin/summary.php?id=e86-a\_4\_846},
  timestamp    = {Tue, 08 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieiceta/NishikawaSS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieiceta/NishikawaSS03a,
  author       = {Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Stable Learning Algorithm for Blind Separation of Temporally Correlated
                  Acoustic Signals Combining Multistage {ICA} and Linear Prediction},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {86-A},
  number       = {8},
  pages        = {2028--2036},
  year         = {2003},
  url          = {http://search.ieice.org/bin/summary.php?id=e86-a\_8\_2028},
  timestamp    = {Tue, 08 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieiceta/NishikawaSS03a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/ArakiMMNS03,
  author       = {Shoko Araki and
                  Ryo Mukai and
                  Shoji Makino and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari},
  title        = {The fundamental limitation of frequency domain blind source separation
                  for convolutive mixtures of speech},
  journal      = {{IEEE} Trans. Speech Audio Process.},
  volume       = {11},
  number       = {2},
  pages        = {109--116},
  year         = {2003},
  url          = {https://doi.org/10.1109/TSA.2003.809193},
  doi          = {10.1109/TSA.2003.809193},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/ArakiMMNS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/TakataniNS03,
  author       = {Tomoya Takatani and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari},
  title        = {Blind source separation based on binaural {ICA}},
  booktitle    = {2003 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} '03, Hong Kong, April 6-10, 2003},
  pages        = {321--324},
  publisher    = {{IEEE}},
  year         = {2003},
  url          = {https://doi.org/10.1109/ICASSP.2003.1199940},
  doi          = {10.1109/ICASSP.2003.1199940},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/TakataniNS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/HinamotoMSS03,
  author       = {Yoichi Hinamoto and
                  Kouichi Mino and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Interface for barge-in free spoken dialogue system based on sound
                  field control and microphone array},
  booktitle    = {2003 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} '03, Hong Kong, April 6-10, 2003},
  pages        = {505--508},
  publisher    = {{IEEE}},
  year         = {2003},
  url          = {https://doi.org/10.1109/ICASSP.2003.1200017},
  doi          = {10.1109/ICASSP.2003.1200017},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/HinamotoMSS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ArakiMANS03,
  author       = {Shoko Araki and
                  Shoji Makino and
                  Robert Aichner and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari},
  title        = {Subband based blind source separation for convolutive mixtures of
                  speech},
  booktitle    = {2003 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} '03, Hong Kong, April 6-10, 2003},
  pages        = {509--512},
  publisher    = {{IEEE}},
  year         = {2003},
  url          = {https://doi.org/10.1109/ICASSP.2003.1200018},
  doi          = {10.1109/ICASSP.2003.1200018},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ArakiMANS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/YamajoSTNS03,
  author       = {Hiroaki Yamajo and
                  Hiroshi Saruwatari and
                  Tomoya Takatani and
                  Tsuyoki Nishikawa and
                  Kiyohiro Shikano},
  title        = {Blind separation and deconvolution for convolutive mixture of speech
                  using {SIMO}-model-based {ICA} and multichannel inverse filtering},
  booktitle    = {8th European Conference on Speech Communication and Technology, {EUROSPEECH}
                  2003 - {INTERSPEECH} 2003, Geneva, Switzerland, September 1-4, 2003},
  pages        = {537--540},
  publisher    = {{ISCA}},
  year         = {2003},
  url          = {https://doi.org/10.21437/Eurospeech.2003-220},
  doi          = {10.21437/EUROSPEECH.2003-220},
  timestamp    = {Thu, 22 Jun 2023 16:42:17 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/YamajoSTNS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/YamadeLSS03,
  author       = {Shingo Yamade and
                  Akinobu Lee and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Unsupervised speaker adaptation based on {HMM} sufficient statistics
                  in various noisy environments},
  booktitle    = {8th European Conference on Speech Communication and Technology, {EUROSPEECH}
                  2003 - {INTERSPEECH} 2003, Geneva, Switzerland, September 1-4, 2003},
  pages        = {1493--1496},
  publisher    = {{ISCA}},
  year         = {2003},
  url          = {https://doi.org/10.21437/Eurospeech.2003-434},
  doi          = {10.21437/EUROSPEECH.2003-434},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/YamadeLSS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ShiraishiTKSS03,
  author       = {Tatsuya Shiraishi and
                  Tomoki Toda and
                  Hiromichi Kawanami and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Simple designing methods of corpus-based visual speech synthesis},
  booktitle    = {8th European Conference on Speech Communication and Technology, {EUROSPEECH}
                  2003 - {INTERSPEECH} 2003, Geneva, Switzerland, September 1-4, 2003},
  pages        = {2241--2244},
  publisher    = {{ISCA}},
  year         = {2003},
  url          = {https://doi.org/10.21437/Eurospeech.2003-627},
  doi          = {10.21437/EUROSPEECH.2003-627},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ShiraishiTKSS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/KawanamiITSS03,
  author       = {Hiromichi Kawanami and
                  Yohei Iwami and
                  Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {{GMM}-based voice conversion applied to emotional speech synthesis},
  booktitle    = {8th European Conference on Speech Communication and Technology, {EUROSPEECH}
                  2003 - {INTERSPEECH} 2003, Geneva, Switzerland, September 1-4, 2003},
  pages        = {2401--2404},
  publisher    = {{ISCA}},
  year         = {2003},
  url          = {https://doi.org/10.21437/Eurospeech.2003-661},
  doi          = {10.21437/EUROSPEECH.2003-661},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/KawanamiITSS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isspa/TakataniNSS03,
  author       = {Tomoya Takatani and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {High-fidelity blind separation for convolutive mixture of acoustic
                  signals using {SIMO}-model-based independent component analysis},
  booktitle    = {Seventh International Symposium on Signal Processing and Its Applications,
                  {ISSPA} 2003, July 1-4, 2003, Paris, France, Proceedings, Volume 2},
  pages        = {77--80},
  publisher    = {{IEEE}},
  year         = {2003},
  url          = {https://doi.org/10.1109/ISSPA.2003.1224819},
  doi          = {10.1109/ISSPA.2003.1224819},
  timestamp    = {Wed, 16 Oct 2019 14:14:56 +0200},
  biburl       = {https://dblp.org/rec/conf/isspa/TakataniNSS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nnsp/SaruwatariYTNS03,
  author       = {Hiroshi Saruwatari and
                  Hiroaki Yamajo and
                  Tomoya Takatani and
                  Tsuyoki Nishikawa and
                  Kiyohiro Shikano},
  title        = {Blind separation and deconvolution of {MIMO} system driven by colored
                  inputs using {SIMO}-model-based {ICA} with information-geometric learning},
  booktitle    = {{NNSP} 2003, {IEEE} {XIII} Workshop on Neural Networks for Signal
                  Processing, Toulouse, France, September 17-19, 2003},
  pages        = {379--388},
  publisher    = {{IEEE}},
  year         = {2003},
  url          = {https://doi.org/10.1109/NNSP.2003.1318037},
  doi          = {10.1109/NNSP.2003.1318037},
  timestamp    = {Wed, 16 Oct 2019 14:14:54 +0200},
  biburl       = {https://dblp.org/rec/conf/nnsp/SaruwatariYTNS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nolisp/NishikawaSS03,
  author       = {Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Stable learning algorithm for low-distortion blind separation of real
                  speech mixture combining multistage {ICA} and linear prediction},
  booktitle    = {{ITRW} on Non-Linear Speech Processing, {NOLISP} 03, Le Croisic, France,
                  May 20-23, 2003},
  pages        = {8},
  publisher    = {{ISCA}},
  year         = {2003},
  url          = {http://www.isca-speech.org/archive\_open/nolisp03/nl03\_008.html},
  timestamp    = {Tue, 08 Apr 2014 18:09:26 +0200},
  biburl       = {https://dblp.org/rec/conf/nolisp/NishikawaSS03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ieiceta/TatekuraSS02,
  author       = {Yosuke Tatekura and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Sound Reproduction System Including Adaptive Compensation of Temperature
                  Fluctuation Effect for Broad-Band Sound Control},
  journal      = {{IEICE} Trans. Fundam. Electron. Commun. Comput. Sci.},
  volume       = {85-A},
  number       = {8},
  pages        = {1851--1860},
  year         = {2002},
  url          = {http://search.ieice.org/bin/summary.php?id=e85-a\_8\_1851},
  timestamp    = {Wed, 09 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieiceta/TatekuraSS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/NishikawaSS02,
  author       = {Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Comparison of time-domain {ICA}, frequency-domain {ICA} and multistage
                  {ICA} for blind source separation},
  booktitle    = {11th European Signal Processing Conference, {EUSIPCO} 2002, Toulouse,
                  France, September 3-6, 2002},
  pages        = {1--4},
  publisher    = {{IEEE}},
  year         = {2002},
  url          = {https://ieeexplore.ieee.org/document/7071932/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/NishikawaSS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/SaruwatariKSSKS02,
  author       = {Hiroshi Saruwatari and
                  Toshiya Kawamura and
                  Katsuyuki Sawai and
                  Kiyohiro Shikano and
                  Atsunobu Kaminuma and
                  Masao Sakata},
  title        = {Evaluation of fast-convergence algorithm for {ICA}-based blind source
                  separation of real convolutive mixture},
  booktitle    = {11th European Signal Processing Conference, {EUSIPCO} 2002, Toulouse,
                  France, September 3-6, 2002},
  pages        = {1--4},
  publisher    = {{IEEE}},
  year         = {2002},
  url          = {https://ieeexplore.ieee.org/document/7072211/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/SaruwatariKSSKS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/TatekuraSS02,
  author       = {Yosuke Tatekura and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Adaptive compensation of temperature fluctuation effect in sound reproduction
                  system},
  booktitle    = {11th European Signal Processing Conference, {EUSIPCO} 2002, Toulouse,
                  France, September 3-6, 2002},
  pages        = {1--4},
  publisher    = {{IEEE}},
  year         = {2002},
  url          = {https://ieeexplore.ieee.org/document/7071928/},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eusipco/TatekuraSS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/NishikawaSS02,
  author       = {Tsuyoki Nishikawa and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Blind source separation based on Multi-Stage {ICA} combining frequency-domain
                  {ICA} and time-domain {ICA}},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2002, May 13-17 2002, Orlando, Florida,
                  {USA}},
  pages        = {917--920},
  publisher    = {{IEEE}},
  year         = {2002},
  url          = {https://doi.org/10.1109/ICASSP.2002.5743889},
  doi          = {10.1109/ICASSP.2002.5743889},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/NishikawaSS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaruwatariKSKS02,
  author       = {Hiroshi Saruwatari and
                  Toshiya Kawamura and
                  Katsuyuki Sawai and
                  Atsunobu Kaminuma and
                  Masao Sakata},
  title        = {Blind source separation based on fast-convergence algorithm using
                  {ICA} and beamforming for real convolutive mixture},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2002, May 13-17 2002, Orlando, Florida,
                  {USA}},
  pages        = {921--924},
  publisher    = {{IEEE}},
  year         = {2002},
  url          = {https://doi.org/10.1109/ICASSP.2002.5743890},
  doi          = {10.1109/ICASSP.2002.5743890},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/SaruwatariKSKS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ArakiHMNMS02,
  author       = {Shoko Araki and
                  Yoichi Hinamoto and
                  Shoji Makino and
                  Tsuyoki Nishikawa and
                  Ryo Mukai and
                  Hiroshi Saruwatari},
  title        = {Equivalence between frequency domain blind source separation and frequency
                  domain adaptive beamforming},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2002, May 13-17 2002, Orlando, Florida,
                  {USA}},
  pages        = {1785--1788},
  publisher    = {{IEEE}},
  year         = {2002},
  url          = {https://doi.org/10.1109/ICASSP.2002.5744969},
  doi          = {10.1109/ICASSP.2002.5744969},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ArakiHMNMS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icdsp/TatekuraSS02,
  author       = {Yosuke Tatekura and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Sound reproduction system with adaptive compensation of temperature
                  fluctuation effect},
  booktitle    = {14th International Conference on Digital Signal Processing, {DSP}
                  2002, Santorini, Greece, July 1-3, 2002},
  pages        = {989--992},
  publisher    = {{IEEE}},
  year         = {2002},
  url          = {https://doi.org/10.1109/ICDSP.2002.1028256},
  doi          = {10.1109/ICDSP.2002.1028256},
  timestamp    = {Tue, 02 Feb 2021 15:02:09 +0100},
  biburl       = {https://dblp.org/rec/conf/icdsp/TatekuraSS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icmcs/NakamuraHAKYNKIS02,
  author       = {Satoshi Nakamura and
                  Kazuo Hiyane and
                  Futoshi Asano and
                  Yutaka Kaneda and
                  Takeshi Yamada and
                  Takanobu Nishiura and
                  Tetsunori Kobayashi and
                  Shiro Ise and
                  Hiroshi Saruwatari},
  title        = {Design and collection of acoustic sound data for hands-free speech
                  recognition and sound scene understanding},
  booktitle    = {Proceedings of the 2002 {IEEE} International Conference on Multimedia
                  and Expo, {ICME} 2002, Lausanne, Switzerland. August 26-29, 2002.
                  Volume {II}},
  pages        = {161--164},
  publisher    = {{IEEE} Computer Society},
  year         = {2002},
  url          = {https://doi.org/10.1109/ICME.2002.1035537},
  doi          = {10.1109/ICME.2002.1035537},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icmcs/NakamuraHAKYNKIS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/YamadeMBLSS02,
  author       = {Shingo Yamade and
                  Kanako Matsunami and
                  Akira Baba and
                  Akinobu Lee and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {John H. L. Hansen and
                  Bryan L. Pellom},
  title        = {Spectral subtraction in noisy environments applied to speaker adaptation
                  based on {HMM} sufficient statistics},
  booktitle    = {7th International Conference on Spoken Language Processing, {ICSLP2002}
                  - {INTERSPEECH} 2002, Denver, Colorado, USA, September 16-20, 2002},
  pages        = {1045--1048},
  publisher    = {{ISCA}},
  year         = {2002},
  url          = {https://doi.org/10.21437/ICSLP.2002-33},
  doi          = {10.21437/ICSLP.2002-33},
  timestamp    = {Thu, 22 Jun 2023 16:42:18 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/YamadeMBLSS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaruwatariSLSKS02,
  author       = {Hiroshi Saruwatari and
                  Katsuyuki Sawai and
                  Akinobu Lee and
                  Kiyohiro Shikano and
                  Atsunobu Kaminuma and
                  Masao Sakata},
  editor       = {John H. L. Hansen and
                  Bryan L. Pellom},
  title        = {Speech enhancement in car environment using blind source separation},
  booktitle    = {7th International Conference on Spoken Language Processing, {ICSLP2002}
                  - {INTERSPEECH} 2002, Denver, Colorado, USA, September 16-20, 2002},
  pages        = {1781--1784},
  publisher    = {{ISCA}},
  year         = {2002},
  url          = {https://doi.org/10.21437/ICSLP.2002-262},
  doi          = {10.21437/ICSLP.2002-262},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SaruwatariSLSKS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/LeeMSS02,
  author       = {Akinobu Lee and
                  Yuichiro Mera and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {John H. L. Hansen and
                  Bryan L. Pellom},
  title        = {Selective multi-path acoustic model based on database likelihoods},
  booktitle    = {7th International Conference on Spoken Language Processing, {ICSLP2002}
                  - {INTERSPEECH} 2002, Denver, Colorado, USA, September 16-20, 2002},
  pages        = {2661--2664},
  publisher    = {{ISCA}},
  year         = {2002},
  url          = {https://doi.org/10.21437/ICSLP.2002-356},
  doi          = {10.21437/ICSLP.2002-356},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/LeeMSS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/NisimuraULSSM02,
  author       = {Ryuichi Nisimura and
                  Takashi Uchida and
                  Akinobu Lee and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano and
                  Yoshio Matsumoto},
  title        = {{ASKA:} receptionist robot with speech dialogue system},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  Lausanne, Switzerland, September 30 - October 4, 2002},
  pages        = {1314--1319},
  publisher    = {{IEEE}},
  year         = {2002},
  url          = {https://doi.org/10.1109/IRDS.2002.1043936},
  doi          = {10.1109/IRDS.2002.1043936},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/NisimuraULSSM02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nnsp/AichnerAMNS02,
  author       = {Robert Aichner and
                  Shoko Araki and
                  Shoji Makino and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari},
  title        = {Time domain blind source separation of non-stationary convolved signals
                  by utilizing geometric beamforming},
  booktitle    = {Proceedings of the 12th {IEEE} Workshop on Neural Networks for Signal
                  Processing, {NNSP} 2002, Martigny, Valais, Switzerland, September
                  4-6, 2002},
  pages        = {445--454},
  publisher    = {{IEEE}},
  year         = {2002},
  url          = {https://doi.org/10.1109/NNSP.2002.1030056},
  doi          = {10.1109/NNSP.2002.1030056},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nnsp/AichnerAMNS02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/TodaSS01,
  author       = {Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Voice conversion algorithm based on {Gaussian} mixture model with dynamic
                  frequency warping of {STRAIGHT} spectrum},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing,
                  {ICASSP} 2001, 7-11 May, 2001, Salt Palace Convention Center, Salt
                  Lake City, Utah, USA, Proceedings},
  pages        = {841--844},
  publisher    = {{IEEE}},
  year         = {2001},
  url          = {https://doi.org/10.1109/ICASSP.2001.941046},
  doi          = {10.1109/ICASSP.2001.941046},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/TodaSS01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaruwatariKT01,
  author       = {Hiroshi Saruwatari and
                  Satoshi Kurita and
                  Kazuya Takeda},
  title        = {Blind source separation combining frequency-domain {ICA} and beamforming},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing,
                  {ICASSP} 2001, 7-11 May, 2001, Salt Palace Convention Center, Salt
                  Lake City, Utah, USA, Proceedings},
  pages        = {2733--2736},
  publisher    = {{IEEE}},
  year         = {2001},
  url          = {https://doi.org/10.1109/ICASSP.2001.940211},
  doi          = {10.1109/ICASSP.2001.940211},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/SaruwatariKT01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ArakiMNS01,
  author       = {Shoko Araki and
                  Shoji Makino and
                  Tsuyoki Nishikawa and
                  Hiroshi Saruwatari},
  title        = {Fundamental limitation of frequency domain blind source separation
                  for convolutive mixture of speech},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing,
                  {ICASSP} 2001, 7-11 May, 2001, Salt Palace Convention Center, Salt
                  Lake City, Utah, USA, Proceedings},
  pages        = {2737--2740},
  publisher    = {{IEEE}},
  year         = {2001},
  url          = {https://doi.org/10.1109/ICASSP.2001.940212},
  doi          = {10.1109/ICASSP.2001.940212},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/ArakiMNS01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/KamiyanagidaSTI01,
  author       = {Hidekazu Kamiyanagida and
                  Hiroshi Saruwatari and
                  Kazuya Takeda and
                  Fumitada Itakura},
  title        = {Direction of arrival estimation based on nonlinear microphone array},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing,
                  {ICASSP} 2001, 7-11 May, 2001, Salt Palace Convention Center, Salt
                  Lake City, Utah, USA, Proceedings},
  pages        = {3033--3036},
  publisher    = {{IEEE}},
  year         = {2001},
  url          = {https://doi.org/10.1109/ICASSP.2001.940297},
  doi          = {10.1109/ICASSP.2001.940297},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/KamiyanagidaSTI01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/TodaSS01,
  author       = {Tomoki Toda and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  editor       = {Paul Dalsgaard and
                  B{\o}rge Lindberg and
                  Henrik Benner and
                  Zheng{-}Hua Tan},
  title        = {High quality voice conversion based on {Gaussian} mixture model with
                  dynamic frequency warping},
  booktitle    = {{EUROSPEECH} 2001 Scandinavia, 7th European Conference on Speech Communication
                  and Technology, 2nd {INTERSPEECH} Event, Aalborg, Denmark, September
                  3-7, 2001},
  pages        = {349--352},
  publisher    = {{ISCA}},
  year         = {2001},
  url          = {https://doi.org/10.21437/Eurospeech.2001-108},
  doi          = {10.21437/EUROSPEECH.2001-108},
  timestamp    = {Thu, 22 Jun 2023 16:42:18 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/TodaSS01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/YamadaBYMLSS01,
  author    = {Yamada, Miichi and
               Baba, Akira and
               Yoshizawa, Shinichi and
               Mera, Yuichiro and
               Lee, Akinobu and
               Saruwatari, Hiroshi and
               Shikano, Kiyohiro},
  editor    = {Dalsgaard, Paul and
               Lindberg, B{\o}rge and
               Benner, Henrik and
               Tan, Zheng{-}Hua},
  title     = {Unsupervised noisy environment adaptation algorithm using {MLLR}
               and speaker selection},
  booktitle = {{EUROSPEECH} 2001 Scandinavia, 7th European Conference on Speech
               Communication and Technology, 2nd {INTERSPEECH} Event, Aalborg,
               Denmark, September 3-7, 2001},
  pages     = {869--872},
  publisher = {{ISCA}},
  year      = {2001},
  url       = {https://doi.org/10.21437/Eurospeech.2001-265},
  doi       = {10.21437/EUROSPEECH.2001-265},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/YamadaBYMLSS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/NisimuraKKNLSS01,
  author    = {Nisimura, Ryuichi and
               Komatsu, Kumiko and
               Kuroda, Yuka and
               Nagatomo, Kentaro and
               Lee, Akinobu and
               Saruwatari, Hiroshi and
               Shikano, Kiyohiro},
  editor    = {Dalsgaard, Paul and
               Lindberg, B{\o}rge and
               Benner, Henrik and
               Tan, Zheng{-}Hua},
  title     = {Automatic n-gram language model creation from web resources},
  booktitle = {{EUROSPEECH} 2001 Scandinavia, 7th European Conference on Speech
               Communication and Technology, 2nd {INTERSPEECH} Event, Aalborg,
               Denmark, September 3-7, 2001},
  pages     = {2127--2130},
  publisher = {{ISCA}},
  year      = {2001},
  url       = {https://doi.org/10.21437/Eurospeech.2001-501},
  doi       = {10.21437/EUROSPEECH.2001-501},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/NisimuraKKNLSS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ArakiMMS01,
  author    = {Araki, Shoko and
               Makino, Shoji and
               Mukai, Ryo and
               Saruwatari, Hiroshi},
  editor    = {Dalsgaard, Paul and
               Lindberg, B{\o}rge and
               Benner, Henrik and
               Tan, Zheng{-}Hua},
  title     = {Equivalence between frequency domain blind source separation and
               frequency domain adaptive null beamformers},
  booktitle = {{EUROSPEECH} 2001 Scandinavia, 7th European Conference on Speech
               Communication and Technology, 2nd {INTERSPEECH} Event, Aalborg,
               Denmark, September 3-7, 2001},
  pages     = {2595--2598},
  publisher = {{ISCA}},
  year      = {2001},
  url       = {https://doi.org/10.21437/Eurospeech.2001-607},
  doi       = {10.21437/EUROSPEECH.2001-607},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ArakiMMS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaruwatariKS01,
  author    = {Saruwatari, Hiroshi and
               Kawamura, Toshiya and
               Shikano, Kiyohiro},
  editor    = {Dalsgaard, Paul and
               Lindberg, B{\o}rge and
               Benner, Henrik and
               Tan, Zheng{-}Hua},
  title     = {Blind source separation for speech based on fast-convergence
               algorithm with {ICA} and beamforming},
  booktitle = {{EUROSPEECH} 2001 Scandinavia, 7th European Conference on Speech
               Communication and Technology, 2nd {INTERSPEECH} Event, Aalborg,
               Denmark, September 3-7, 2001},
  pages     = {2603--2606},
  publisher = {{ISCA}},
  year      = {2001},
  url       = {https://doi.org/10.21437/Eurospeech.2001-609},
  doi       = {10.21437/EUROSPEECH.2001-609},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/SaruwatariKS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eusipco/SaruwatariKTI00,
  author    = {Saruwatari, Hiroshi and
               Kajita, Shoji and
               Takeda, Kazuya and
               Itakura, Fumitada},
  title     = {Speech enhancement based on noise adaptive nonlinear microphone array},
  booktitle = {10th European Signal Processing Conference, {EUSIPCO} 2000,
               Tampere, Finland, September 4-8, 2000},
  pages     = {1--4},
  publisher = {{IEEE}},
  year      = {2000},
  url       = {https://ieeexplore.ieee.org/document/7075316/},
  timestamp = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/eusipco/SaruwatariKTI00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaruwatariKTI00,
  author    = {Saruwatari, Hiroshi and
               Kajita, Shoji and
               Takeda, Kazuya and
               Itakura, Fumitada},
  title     = {Speech enhancement using nonlinear microphone array with noise
               adaptive complementary beamforming},
  booktitle = {{IEEE} International Conference on Acoustics, Speech, and Signal
               Processing. {ICASSP} 2000, 5-9 June, 2000, Hilton Hotel and
               Convention Center, Istanbul, Turkey},
  pages     = {1049--1052},
  publisher = {{IEEE}},
  year      = {2000},
  url       = {https://doi.org/10.1109/ICASSP.2000.859143},
  doi       = {10.1109/ICASSP.2000.859143},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/SaruwatariKTI00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/KuritaSKTI00,
  author    = {Kurita, Satoshi and
               Saruwatari, Hiroshi and
               Kajita, Shoji and
               Takeda, Kazuya and
               Itakura, Fumitada},
  title     = {Evaluation of blind signal separation method using directivity
               pattern under reverberant conditions},
  booktitle = {{IEEE} International Conference on Acoustics, Speech, and Signal
               Processing. {ICASSP} 2000, 5-9 June, 2000, Hilton Hotel and
               Convention Center, Istanbul, Turkey},
  pages     = {3140--3143},
  publisher = {{IEEE}},
  year      = {2000},
  url       = {https://doi.org/10.1109/ICASSP.2000.861203},
  doi       = {10.1109/ICASSP.2000.861203},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/KuritaSKTI00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaruwatariKTIS00,
  author    = {Saruwatari, Hiroshi and
               Kurita, Satoshi and
               Takeda, Kazuya and
               Itakura, Fumitada and
               Shikano, Kiyohiro},
  title     = {Blind source separation based on subband {ICA} and beamforming},
  booktitle = {Sixth International Conference on Spoken Language Processing,
               {ICSLP} 2000 / {INTERSPEECH} 2000, Beijing, China, October 16-20,
               2000},
  pages     = {94--97},
  publisher = {{ISCA}},
  year      = {2000},
  url       = {https://doi.org/10.21437/ICSLP.2000-486},
  doi       = {10.21437/ICSLP.2000-486},
  timestamp = {Thu, 22 Jun 2023 16:42:19 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/SaruwatariKTIS00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The proper noun Gaussian is brace-protected in the title so that
% sentence-casing bibliography styles keep its capital letter.
% NOTE(review): the leading word Straight may be the acronym STRAIGHT;
% confirm against the publisher record before changing the title text.
@inproceedings{DBLP:conf/interspeech/TodaLSS00,
  author       = {Tomoki Toda and
                  Jinlin Lu and
                  Hiroshi Saruwatari and
                  Kiyohiro Shikano},
  title        = {Straight-based voice conversion algorithm based on {Gaussian} mixture
                  model},
  booktitle    = {Sixth International Conference on Spoken Language Processing, {ICSLP}
                  2000 / {INTERSPEECH} 2000, Beijing, China, October 16-20, 2000},
  pages        = {279--282},
  publisher    = {{ISCA}},
  year         = {2000},
  url          = {https://doi.org/10.21437/ICSLP.2000-532},
  doi          = {10.21437/ICSLP.2000-532},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/TodaLSS00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaruwatariKTI99,
  author    = {Saruwatari, Hiroshi and
               Kajita, Shoji and
               Takeda, Kazuya and
               Itakura, Fumitada},
  title     = {Speech enhancement using nonlinear microphone array with
               complementary beamforming},
  booktitle = {Proceedings of the 1999 {IEEE} International Conference on
               Acoustics, Speech, and Signal Processing, {ICASSP} '99, Phoenix,
               Arizona, USA, March 15-19, 1999},
  pages     = {69--72},
  publisher = {{IEEE} Computer Society},
  year      = {1999},
  url       = {https://doi.org/10.1109/ICASSP.1999.758064},
  doi       = {10.1109/ICASSP.1999.758064},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/SaruwatariKTI99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/OmuraYSKTI99,
  author    = {Omura, Michiaki and
               Yada, Motohiko and
               Saruwatari, Hiroshi and
               Kajita, Shoji and
               Takeda, Kazuya and
               Itakura, Fumitada},
  title     = {Compensating of room acoustic transfer functions affected by
               change of room temperature},
  booktitle = {Proceedings of the 1999 {IEEE} International Conference on
               Acoustics, Speech, and Signal Processing, {ICASSP} '99, Phoenix,
               Arizona, USA, March 15-19, 1999},
  pages     = {941--944},
  publisher = {{IEEE} Computer Society},
  year      = {1999},
  url       = {https://doi.org/10.1109/ICASSP.1999.759827},
  doi       = {10.1109/ICASSP.1999.759827},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/OmuraYSKTI99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaruwatariKTI99,
  author    = {Saruwatari, Hiroshi and
               Kajita, Shoji and
               Takeda, Kazuya and
               Itakura, Fumitada},
  title     = {Speech enhancement using nonlinear microphone array under
               nonstationary noise conditions},
  booktitle = {Sixth European Conference on Speech Communication and Technology,
               {EUROSPEECH} 1999, Budapest, Hungary, September 5-9, 1999},
  pages     = {2567--2570},
  publisher = {{ISCA}},
  year      = {1999},
  url       = {https://doi.org/10.21437/Eurospeech.1999-564},
  doi       = {10.21437/EUROSPEECH.1999-564},
  timestamp = {Sat, 01 Jul 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/SaruwatariKTI99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics