BibTeX records: Vincent Wan

download as .bib file

@inproceedings{DBLP:conf/interspeech/FinkelsteinZCCJ22,
  author    = {Finkelstein, Lev and
               Zen, Heiga and
               Casagrande, Norman and
               Chan, Chun{-}an and
               Jia, Ye and
               Kenter, Tom and
               Petelin, Alexey and
               Shen, Jonathan and
               Wan, Vincent and
               Zhang, Yu and
               Wu, Yonghui and
               Clark, Rob},
  editor    = {Ko, Hanseok and
               Hansen, John H. L.},
  title     = {Training Text-To-Speech Systems From Synthetic Data: {A} Practical
               Approach For Accent Transfer Tasks},
  booktitle = {Interspeech 2022, 23rd Annual Conference of the International Speech
               Communication Association, Incheon, Korea, 18-22 September 2022},
  pages     = {4571--4575},
  publisher = {{ISCA}},
  year      = {2022},
  doi       = {10.21437/INTERSPEECH.2022-10115},
  url       = {https://doi.org/10.21437/Interspeech.2022-10115},
  timestamp = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/FinkelsteinZCCJ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2208-13183,
  author     = {Finkelstein, Lev and
                Zen, Heiga and
                Casagrande, Norman and
                Chan, Chun{-}an and
                Jia, Ye and
                Kenter, Tom and
                Petelin, Alexey and
                Shen, Jonathan and
                Wan, Vincent and
                Zhang, Yu and
                Wu, Yonghui and
                Clark, Rob},
  title      = {Training Text-To-Speech Systems From Synthetic Data: {A} Practical
                Approach For Accent Transfer Tasks},
  journal    = {CoRR},
  volume     = {abs/2208.13183},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2208.13183},
  doi        = {10.48550/ARXIV.2208.13183},
  url        = {https://doi.org/10.48550/arXiv.2208.13183},
  timestamp  = {Wed, 25 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2208-13183.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "CHiVE" is brace-protected so sentence-casing styles keep its mixed capitalisation.
@inproceedings{DBLP:conf/icml/KenterWCCV19,
  author    = {Kenter, Tom and
               Wan, Vincent and
               Chan, Chun{-}an and
               Clark, Rob and
               V{\'{\i}}t, Jakub},
  editor    = {Chaudhuri, Kamalika and
               Salakhutdinov, Ruslan},
  title     = {{CHiVE}: Varying Prosody in Speech Synthesis with a Linguistically Driven
               Dynamic Hierarchical Conditional Variational Network},
  booktitle = {Proceedings of the 36th International Conference on Machine Learning,
               {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {97},
  pages     = {3331--3340},
  publisher = {{PMLR}},
  year      = {2019},
  url       = {https://proceedings.mlr.press/v97/kenter19a.html},
  timestamp = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/KenterWCCV19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "CHiVE" is brace-protected so sentence-casing styles keep its mixed capitalisation.
@article{DBLP:journals/corr/abs-1905-07195,
  author     = {Wan, Vincent and
                Chan, Chun{-}an and
                Kenter, Tom and
                V{\'{\i}}t, Jakub and
                Clark, Rob},
  title      = {{CHiVE}: Varying Prosody in Speech Synthesis with a Linguistically Driven
                Dynamic Hierarchical Conditional Variational Network},
  journal    = {CoRR},
  volume     = {abs/1905.07195},
  year       = {2019},
  eprinttype = {arXiv},
  eprint     = {1905.07195},
  url        = {https://arxiv.org/abs/1905.07195},
  timestamp  = {Tue, 28 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-07195.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "LSTM" is brace-protected so sentence-casing styles do not lowercase the acronym.
@inproceedings{DBLP:conf/interspeech/WanASV17,
  author    = {Wan, Vincent and
               Agiomyrgiannakis, Yannis and
               Sil{\'{e}}n, Hanna and
               V{\'{\i}}t, Jakub},
  editor    = {Lacerda, Francisco},
  title     = {Google's Next-Generation Real-Time Unit-Selection Synthesizer Using
               Sequence-to-Sequence {LSTM}-Based Autoencoders},
  booktitle = {Interspeech 2017, 18th Annual Conference of the International Speech
               Communication Association, Stockholm, Sweden, August 20-24, 2017},
  pages     = {1143--1147},
  publisher = {{ISCA}},
  year      = {2017},
  doi       = {10.21437/INTERSPEECH.2017-1107},
  url       = {https://doi.org/10.21437/Interspeech.2017-1107},
  timestamp = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/WanASV17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "Van Dongen" is entered in "Last, First" form so BibTeX keeps the two-word surname together.
@article{DBLP:journals/cviu/CassidySDYAWBC16,
  author    = {Cassidy, Sarah A. and
               Stenger, Bj{\"{o}}rn and
               Van Dongen, L. and
               Yanagisawa, Kayoko and
               Anderson, Robert and
               Wan, Vincent and
               Baron{-}Cohen, Simon and
               Cipolla, Roberto},
  title     = {Expressive visual text-to-speech as an assistive technology for individuals
               with autism spectrum conditions},
  journal   = {Comput. Vis. Image Underst.},
  volume    = {148},
  pages     = {193--200},
  year      = {2016},
  doi       = {10.1016/J.CVIU.2015.08.011},
  url       = {https://doi.org/10.1016/j.cviu.2015.08.011},
  timestamp = {Thu, 01 Jul 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/cviu/CassidySDYAWBC16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jstsp/WanLYBCGA14,
  author    = {Wan, Vincent and
               Latorre, Javier and
               Yanagisawa, Kayoko and
               Braunschweiler, Norbert and
               Chen, Langzhou and
               Gales, Mark J. F. and
               Akamine, Masami},
  title     = {Building {HMM-TTS} Voices on Diverse Data},
  journal   = {{IEEE} J. Sel. Top. Signal Process.},
  volume    = {8},
  number    = {2},
  pages     = {296--306},
  year      = {2014},
  doi       = {10.1109/JSTSP.2013.2295058},
  url       = {https://doi.org/10.1109/JSTSP.2013.2295058},
  timestamp = {Thu, 09 Jul 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jstsp/WanLYBCGA14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/WanLYGS14,
  author    = {Wan, Vincent and
               Latorre, Javier and
               Yanagisawa, Kayoko and
               Gales, Mark J. F. and
               Stylianou, Yannis},
  title     = {Cluster adaptive training of average voice models},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
               {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages     = {280--284},
  publisher = {{IEEE}},
  year      = {2014},
  doi       = {10.1109/ICASSP.2014.6853602},
  url       = {https://doi.org/10.1109/ICASSP.2014.6853602},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/WanLYGS14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ChenGKBCCW14,
  author    = {Chen, Xie and
               Gales, Mark J. F. and
               Knill, Kate M. and
               Breslin, Catherine and
               Chen, Langzhou and
               Chin, K. K. and
               Wan, Vincent},
  editor    = {Li, Haizhou and
               Meng, Helen M. and
               Ma, Bin and
               Chng, Engsiong and
               Xie, Lei},
  title     = {An initial investigation of long-term adaptation for meeting transcription},
  booktitle = {{INTERSPEECH} 2014, 15th Annual Conference of the International Speech
               Communication Association, Singapore, September 14-18, 2014},
  pages     = {954--958},
  publisher = {{ISCA}},
  year      = {2014},
  doi       = {10.21437/INTERSPEECH.2014-253},
  url       = {https://doi.org/10.21437/Interspeech.2014-253},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ChenGKBCCW14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/KolluruWLYG14,
  author    = {Kolluru, BalaKrishna and
               Wan, Vincent and
               Latorre, Javier and
               Yanagisawa, Kayoko and
               Gales, Mark J. F.},
  editor    = {Li, Haizhou and
               Meng, Helen M. and
               Ma, Bin and
               Chng, Engsiong and
               Xie, Lei},
  title     = {Generating multiple-accent pronunciations for {TTS} using joint sequence
               model interpolation},
  booktitle = {{INTERSPEECH} 2014, 15th Annual Conference of the International Speech
               Communication Association, Singapore, September 14-18, 2014},
  pages     = {1273--1277},
  publisher = {{ISCA}},
  year      = {2014},
  doi       = {10.21437/INTERSPEECH.2014-318},
  url       = {https://doi.org/10.21437/Interspeech.2014-318},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/KolluruWLYG14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/LatorreWY14,
  author    = {Latorre, Javier and
               Wan, Vincent and
               Yanagisawa, Kayoko},
  editor    = {Li, Haizhou and
               Meng, Helen M. and
               Ma, Bin and
               Chng, Engsiong and
               Xie, Lei},
  title     = {Voice expression conversion with factorised {HMM-TTS} models},
  booktitle = {{INTERSPEECH} 2014, 15th Annual Conference of the International Speech
               Communication Association, Singapore, September 14-18, 2014},
  pages     = {1514--1518},
  publisher = {{ISCA}},
  year      = {2014},
  doi       = {10.21437/INTERSPEECH.2014-363},
  url       = {https://doi.org/10.21437/Interspeech.2014-363},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/LatorreWY14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/LatorreYWKG14,
  author    = {Latorre, Javier and
               Yanagisawa, Kayoko and
               Wan, Vincent and
               Kolluru, BalaKrishna and
               Gales, Mark J. F.},
  editor    = {Li, Haizhou and
               Meng, Helen M. and
               Ma, Bin and
               Chng, Engsiong and
               Xie, Lei},
  title     = {Speech intonation for {TTS:} study on evaluation methodology},
  booktitle = {{INTERSPEECH} 2014, 15th Annual Conference of the International Speech
               Communication Association, Singapore, September 14-18, 2014},
  pages     = {2957--2961},
  publisher = {{ISCA}},
  year      = {2014},
  doi       = {10.21437/INTERSPEECH.2014-204},
  url       = {https://doi.org/10.21437/Interspeech.2014-204},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/LatorreYWKG14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/AndersonSWC13,
  author    = {Anderson, Robert and
               Stenger, Bj{\"{o}}rn and
               Wan, Vincent and
               Cipolla, Roberto},
  title     = {Expressive Visual Text-to-Speech Using Active Appearance Models},
  booktitle = {2013 {IEEE} Conference on Computer Vision and Pattern Recognition,
               Portland, OR, USA, June 23-28, 2013},
  pages     = {3382--3389},
  publisher = {{IEEE} Computer Society},
  year      = {2013},
  doi       = {10.1109/CVPR.2013.434},
  url       = {https://doi.org/10.1109/CVPR.2013.434},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/cvpr/AndersonSWC13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/WanABBCKLMSYSAGC13,
  author    = {Wan, Vincent and
               Anderson, Robert and
               Blokland, Art and
               Braunschweiler, Norbert and
               Chen, Langzhou and
               Kolluru, BalaKrishna and
               Latorre, Javier and
               Maia, Ranniery and
               Stenger, Bj{\"{o}}rn and
               Yanagisawa, Kayoko and
               Stylianou, Yannis and
               Akamine, Masami and
               Gales, Mark J. F. and
               Cipolla, Roberto},
  editor    = {Bimbot, Fr{\'{e}}d{\'{e}}ric and
               Cerisara, Christophe and
               Fougeron, C{\'{e}}cile and
               Gravier, Guillaume and
               Lamel, Lori and
               Pellegrino, Fran{\c{c}}ois and
               Perrier, Pascal},
  title     = {Photo-realistic expressive text to talking head synthesis},
  booktitle = {{INTERSPEECH} 2013, 14th Annual Conference of the International Speech
               Communication Association, Lyon, France, August 25-29, 2013},
  pages     = {2667--2669},
  publisher = {{ISCA}},
  year      = {2013},
  url       = {https://www.isca-speech.org/archive/interspeech\_2013/wan13\_interspeech.html},
  timestamp = {Tue, 27 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/WanABBCKLMSYSAGC13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "3D" is brace-protected so sentence-casing styles do not turn it into "3d".
@inproceedings{DBLP:conf/siggraph/AndersonSWC13,
  author    = {Anderson, Robert and
               Stenger, Bj{\"{o}}rn and
               Wan, Vincent and
               Cipolla, Roberto},
  title     = {An expressive text-driven {3D} talking head},
  booktitle = {Special Interest Group on Computer Graphics and Interactive Techniques
               Conference, {SIGGRAPH} '13, Anaheim, CA, USA, July 21-25, 2013, Poster
               Proceedings},
  pages     = {80},
  publisher = {{ACM}},
  year      = {2013},
  doi       = {10.1145/2503385.2503473},
  url       = {https://doi.org/10.1145/2503385.2503473},
  timestamp = {Fri, 12 Mar 2021 10:43:26 +0100},
  biburl    = {https://dblp.org/rec/conf/siggraph/AndersonSWC13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The ISCA archive link uses https, like the other ISCA archive URLs in this file.
@inproceedings{DBLP:conf/ssw/YanagisawaLWGK13,
  author    = {Yanagisawa, Kayoko and
               Latorre, Javier and
               Wan, Vincent and
               Gales, Mark J. F. and
               King, Simon},
  title     = {Noise robustness in {HMM-TTS} speaker adaptation},
  booktitle = {The Eighth {ISCA} Tutorial and Research Workshop on Speech Synthesis,
               Barcelona, Spain, August 31-September 2, 2013},
  pages     = {119--124},
  publisher = {{ISCA}},
  year      = {2013},
  url       = {https://www.isca-speech.org/archive/ssw8/ssw8\_119.html},
  timestamp = {Sat, 03 Feb 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ssw/YanagisawaLWGK13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Surname "El Hannani" is entered in "Last, First" form so BibTeX does not split it;
% the journal title is the Audio, Speech, and Language Processing one, matching the TASL DOI.
@article{DBLP:journals/taslp/HainBDGGHHKLW12,
  author    = {Hain, Thomas and
               Burget, Luk{\'{a}}s and
               Dines, John and
               Garner, Philip N. and
               Gr{\'{e}}zl, Frantisek and
               El Hannani, Asmaa and
               Huijbregts, Marijn and
               Karafi{\'{a}}t, Martin and
               Lincoln, Mike and
               Wan, Vincent},
  title     = {Transcribing Meetings With the {AMIDA} Systems},
  journal   = {{IEEE} Trans. Audio Speech Lang. Process.},
  volume    = {20},
  number    = {2},
  pages     = {486--498},
  year      = {2012},
  doi       = {10.1109/TASL.2011.2163395},
  url       = {https://doi.org/10.1109/TASL.2011.2163395},
  timestamp = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/taslp/HainBDGGHHKLW12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/EybenBBLWGK12,
  author    = {Eyben, Florian and
               Buchholz, Sabine and
               Braunschweiler, Norbert and
               Latorre, Javier and
               Wan, Vincent and
               Gales, Mark J. F. and
               Knill, Kate},
  title     = {Unsupervised clustering of emotion and voice styles for expressive
               {TTS}},
  booktitle = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
               Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages     = {4009--4012},
  publisher = {{IEEE}},
  year      = {2012},
  doi       = {10.1109/ICASSP.2012.6288797},
  url       = {https://doi.org/10.1109/ICASSP.2012.6288797},
  timestamp = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/EybenBBLWGK12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ChenGWLA12,
  author    = {Chen, Langzhou and
               Gales, Mark J. F. and
               Wan, Vincent and
               Latorre, Javier and
               Akamine, Masami},
  title     = {Exploring Rich Expressive Information from Audiobook Data Using Cluster
               Adaptive Training},
  booktitle = {{INTERSPEECH} 2012, 13th Annual Conference of the International Speech
               Communication Association, Portland, Oregon, USA, September 9-13,
               2012},
  pages     = {959--962},
  publisher = {{ISCA}},
  year      = {2012},
  doi       = {10.21437/INTERSPEECH.2012-286},
  url       = {https://doi.org/10.21437/Interspeech.2012-286},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ChenGWLA12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/LatorreWGCCKA12,
  author    = {Latorre, Javier and
               Wan, Vincent and
               Gales, Mark J. F. and
               Chen, Langzhou and
               Chin, K. K. and
               Knill, Kate and
               Akamine, Masami},
  title     = {Speech factorization for {HMM-TTS} based on cluster adaptive training},
  booktitle = {{INTERSPEECH} 2012, 13th Annual Conference of the International Speech
               Communication Association, Portland, Oregon, USA, September 9-13,
               2012},
  pages     = {971--974},
  publisher = {{ISCA}},
  year      = {2012},
  doi       = {10.21437/INTERSPEECH.2012-289},
  url       = {https://doi.org/10.21437/Interspeech.2012-289},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/LatorreWGCCKA12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/WanLCCGZKA12,
  author    = {Wan, Vincent and
               Latorre, Javier and
               Chin, K. K. and
               Chen, Langzhou and
               Gales, Mark J. F. and
               Zen, Heiga and
               Knill, Kate and
               Akamine, Masami},
  title     = {Combining multiple high quality corpora for improving {HMM-TTS}},
  booktitle = {{INTERSPEECH} 2012, 13th Annual Conference of the International Speech
               Communication Association, Portland, Oregon, USA, September 9-13,
               2012},
  pages     = {1135--1138},
  publisher = {{ISCA}},
  year      = {2012},
  doi       = {10.21437/INTERSPEECH.2012-357},
  url       = {https://doi.org/10.21437/Interspeech.2012-357},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/WanLCCGZKA12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "Audio Notetaker" and "WebASR" are brace-protected so sentence-casing styles keep their capitalisation.
@inproceedings{DBLP:conf/interspeech/TuckerFWWH11,
  author    = {Tucker, Roger C. F. and
               Fry, Dan and
               Wan, Vincent and
               Wrigley, Stuart N. and
               Hain, Thomas},
  title     = {Extending {Audio Notetaker} to Browse {WebASR} Transcriptions},
  booktitle = {{INTERSPEECH} 2011, 12th Annual Conference of the International Speech
               Communication Association, Florence, Italy, August 27-31, 2011},
  pages     = {3329--3330},
  publisher = {{ISCA}},
  year      = {2011},
  url       = {https://www.isca-speech.org/archive/interspeech\_2011/tucker11\_interspeech.html},
  timestamp = {Tue, 27 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/TuckerFWWH11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Surname "El Hannani" is entered in "Last, First" form so BibTeX does not split it.
@inproceedings{DBLP:conf/interspeech/HainBDGHHKLW10,
  author    = {Hain, Thomas and
               Burget, Luk{\'{a}}s and
               Dines, John and
               Garner, Philip N. and
               El Hannani, Asmaa and
               Huijbregts, Marijn and
               Karafi{\'{a}}t, Martin and
               Lincoln, Mike and
               Wan, Vincent},
  editor    = {Kobayashi, Takao and
               Hirose, Keikichi and
               Nakamura, Satoshi},
  title     = {The {AMIDA} 2009 meeting transcription system},
  booktitle = {{INTERSPEECH} 2010, 11th Annual Conference of the International Speech
               Communication Association, Makuhari, Chiba, Japan, September 26-30,
               2010},
  pages     = {358--361},
  publisher = {{ISCA}},
  year      = {2010},
  doi       = {10.21437/INTERSPEECH.2010-130},
  url       = {https://doi.org/10.21437/Interspeech.2010-130},
  timestamp = {Sun, 06 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/HainBDGHHKLW10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Surname "El Hannani" is entered in "Last, First" form so BibTeX does not split it.
@inproceedings{DBLP:conf/interspeech/GarnerDHHKKLWZ09,
  author    = {Garner, Philip N. and
               Dines, John and
               Hain, Thomas and
               El Hannani, Asmaa and
               Karafi{\'{a}}t, Martin and
               Korchagin, Danil and
               Lincoln, Mike and
               Wan, Vincent and
               Zhang, Le},
  title     = {Real-time {ASR} from meetings},
  booktitle = {{INTERSPEECH} 2009, 10th Annual Conference of the International Speech
               Communication Association, Brighton, United Kingdom, September 6-10,
               2009},
  pages     = {2119--2122},
  publisher = {{ISCA}},
  year      = {2009},
  doi       = {10.21437/INTERSPEECH.2009-606},
  url       = {https://doi.org/10.21437/Interspeech.2009-606},
  timestamp = {Sun, 06 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/GarnerDHHKKLWZ09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Surname "El Hannani" is entered in "Last, First" form so BibTeX does not split it;
% "webASR" is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/interspeech/HainHWW08,
  author    = {Hain, Thomas and
               El Hannani, Asmaa and
               Wrigley, Stuart N. and
               Wan, Vincent},
  title     = {Automatic speech recognition for scientific purposes - {webASR}},
  booktitle = {{INTERSPEECH} 2008, 9th Annual Conference of the International Speech
               Communication Association, Brisbane, Australia, September 22-26, 2008},
  pages     = {504--507},
  publisher = {{ISCA}},
  year      = {2008},
  doi       = {10.21437/INTERSPEECH.2008-86},
  url       = {https://doi.org/10.21437/Interspeech.2008-86},
  timestamp = {Sun, 06 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/HainHWW08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/CarmichaelWG08,
  author    = {Carmichael, James and
               Wan, Vincent and
               Green, Phil D.},
  title     = {Combining neural network and rule-based systems for dysarthria diagnosis},
  booktitle = {{INTERSPEECH} 2008, 9th Annual Conference of the International Speech
               Communication Association, Brisbane, Australia, September 22-26, 2008},
  pages     = {2226--2229},
  publisher = {{ISCA}},
  year      = {2008},
  doi       = {10.21437/INTERSPEECH.2008-581},
  url       = {https://doi.org/10.21437/Interspeech.2008-581},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/CarmichaelWG08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Surname "El Hannani" is entered in "Last, First" form so BibTeX does not split it.
@inproceedings{DBLP:conf/slt/WanDHH08,
  author    = {Wan, Vincent and
               Dines, John and
               El Hannani, Asmaa and
               Hain, Thomas},
  editor    = {Das, Amitava and
               Bangalore, Srinivas},
  title     = {Bob: {A} lexicon and pronunciation dictionary generator},
  booktitle = {2008 {IEEE} Spoken Language Technology Workshop, {SLT} 2008, Goa,
               India, December 15-19, 2008},
  pages     = {217--220},
  publisher = {{IEEE}},
  year      = {2008},
  doi       = {10.1109/SLT.2008.4777879},
  url       = {https://doi.org/10.1109/SLT.2008.4777879},
  timestamp = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/slt/WanDHH08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The double-issue range uses a double hyphen (en dash), the same way the page range does.
@article{DBLP:journals/speech/ScharenborgWM07,
  author    = {Scharenborg, Odette and
               Wan, Vincent and
               Moore, Roger K.},
  title     = {Towards capturing fine phonetic variation in speech using articulatory
               features},
  journal   = {Speech Commun.},
  volume    = {49},
  number    = {10--11},
  pages     = {811--826},
  year      = {2007},
  doi       = {10.1016/J.SPECOM.2007.01.005},
  url       = {https://doi.org/10.1016/j.specom.2007.01.005},
  timestamp = {Tue, 29 Dec 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/speech/ScharenborgWM07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/clear/HainBDGKLLW07,
  author    = {Hain, Thomas and
               Burget, Luk{\'{a}}s and
               Dines, John and
               Garau, Giulia and
               Karafi{\'{a}}t, Martin and
               van Leeuwen, David A. and
               Lincoln, Mike and
               Wan, Vincent},
  editor    = {Stiefelhagen, Rainer and
               Bowers, Rachel and
               Fiscus, Jonathan G.},
  title     = {The 2007 {AMI(DA)} System for Meeting Transcription},
  booktitle = {Multimodal Technologies for Perception of Humans, International Evaluation
               Workshops {CLEAR} 2007 and {RT} 2007, Baltimore, MD, USA, May 8-11,
               2007, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {4625},
  pages     = {414--428},
  publisher = {Springer},
  year      = {2007},
  doi       = {10.1007/978-3-540-68585-2\_39},
  url       = {https://doi.org/10.1007/978-3-540-68585-2\_39},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/clear/HainBDGKLLW07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/HainWBKDVGL07,
  author    = {Hain, Thomas and
               Wan, Vincent and
               Burget, Luk{\'{a}}s and
               Karafi{\'{a}}t, Martin and
               Dines, John and
               Vepa, Jithendra and
               Garau, Giulia and
               Lincoln, Mike},
  title     = {The {AMI} System for the Transcription of Speech in Meetings},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
               and Signal Processing, {ICASSP} 2007, Honolulu, Hawaii, USA, April
               15-20, 2007},
  pages     = {357--360},
  publisher = {{IEEE}},
  year      = {2007},
  doi       = {10.1109/ICASSP.2007.366923},
  url       = {https://doi.org/10.1109/ICASSP.2007.366923},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/HainWBKDVGL07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/Pereiro-EstevanWS07,
  author    = {Pereiro{-}Estevan, Yago and
               Wan, Vincent and
               Scharenborg, Odette},
  title     = {Finding Maximum Margin Segments in Speech},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
               and Signal Processing, {ICASSP} 2007, Honolulu, Hawaii, USA, April
               15-20, 2007},
  pages     = {937--940},
  publisher = {{IEEE}},
  year      = {2007},
  doi       = {10.1109/ICASSP.2007.367225},
  url       = {https://doi.org/10.1109/ICASSP.2007.367225},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/Pereiro-EstevanWS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ScharenborgEW07,
  author    = {Scharenborg, Odette and
               Ernestus, Mirjam and
               Wan, Vincent},
  title     = {Segmentation of speech: child's play?},
  booktitle = {{INTERSPEECH} 2007, 8th Annual Conference of the International Speech
               Communication Association, Antwerp, Belgium, August 27-31, 2007},
  pages     = {1953--1956},
  publisher = {{ISCA}},
  year      = {2007},
  doi       = {10.21437/INTERSPEECH.2007-47},
  url       = {https://doi.org/10.21437/Interspeech.2007-47},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ScharenborgEW07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ScharenborgW07,
  author    = {Scharenborg, Odette and
               Wan, Vincent},
  title     = {Can unquantised articulatory feature continuums be modelled?},
  booktitle = {{INTERSPEECH} 2007, 8th Annual Conference of the International Speech
               Communication Association, Antwerp, Belgium, August 27-31, 2007},
  pages     = {2473--2476},
  publisher = {{ISCA}},
  year      = {2007},
  doi       = {10.21437/INTERSPEECH.2007-658},
  url       = {https://doi.org/10.21437/Interspeech.2007-658},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ScharenborgW07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/WanH06,
  author       = {Wan, Vincent and Hain, Thomas},
  title        = {Strategies for Language Model Web-Data Collection},
  booktitle    = {2006 {IEEE} International Conference on Acoustics Speech and Signal Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages        = {1069--1072},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/ICASSP.2006.1660209},
  doi          = {10.1109/ICASSP.2006.1660209},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/WanH06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/mlmi/HainBDGKLVW06,
  author       = {Thomas Hain and
                  Luk{\'{a}}s Burget and
                  John Dines and
                  Giulia Garau and
                  Martin Karafi{\'{a}}t and
                  Mike Lincoln and
                  Jithendra Vepa and
                  Vincent Wan},
  editor       = {Steve Renals and
                  Samy Bengio and
                  Jonathan G. Fiscus},
  title        = {The {AMI} Meeting Transcription System: Progress and Performance},
  booktitle    = {Machine Learning for Multimodal Interaction, Third International Workshop,
                  {MLMI} 2006, Bethesda, MD, USA, May 1-4, 2006, Revised Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {4299},
  pages        = {419--431},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/11965152_37},
  doi          = {10.1007/11965152_37},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/mlmi/HainBDGKLVW06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/WrigleyBWR05,
  author       = {Wrigley, Stuart N. and Brown, Guy J. and Wan, Vincent and Renals, Steve},
  title        = {Speech and crosstalk detection in multichannel audio},
  journal      = {{IEEE} Trans. Speech Audio Process.},
  volume       = {13},
  number       = {1},
  pages        = {84--91},
  year         = {2005},
  url          = {https://doi.org/10.1109/TSA.2004.838531},
  doi          = {10.1109/TSA.2004.838531},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/WrigleyBWR05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/taslp/WanR05,
  author       = {Wan, Vincent and Renals, Steve},
  title        = {Speaker verification using sequence discriminant support vector machines},
  journal      = {{IEEE} Trans. Speech Audio Process.},
  volume       = {13},
  number       = {2},
  pages        = {203--210},
  year         = {2005},
  url          = {https://doi.org/10.1109/TSA.2004.841042},
  doi          = {10.1109/TSA.2004.841042},
  timestamp    = {Sun, 17 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/WanR05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/HainDGKMWOR05,
  author       = {Hain, Thomas and
                  Dines, John and
                  Garau, Giulia and
                  Karafi{\'{a}}t, Martin and
                  Moore, Darren and
                  Wan, Vincent and
                  Ordelman, Roeland and
                  Renals, Steve},
  title        = {Transcription of conference room meetings: an investigation},
  booktitle    = {{INTERSPEECH} 2005 - Eurospeech, 9th European Conference on Speech Communication and Technology, Lisbon, Portugal, September 4-8, 2005},
  pages        = {1661--1664},
  publisher    = {{ISCA}},
  year         = {2005},
  url          = {https://doi.org/10.21437/Interspeech.2005-543},
  doi          = {10.21437/INTERSPEECH.2005-543},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HainDGKMWOR05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/WanC05,
  author       = {Wan, Vincent and Carmichael, James},
  title        = {Polynomial dynamic time warping kernel support vector machines for dysarthric speech recognition with sparse training data},
  booktitle    = {{INTERSPEECH} 2005 - Eurospeech, 9th European Conference on Speech Communication and Technology, Lisbon, Portugal, September 4-8, 2005},
  pages        = {3321--3324},
  publisher    = {{ISCA}},
  year         = {2005},
  url          = {https://doi.org/10.21437/Interspeech.2005-853},
  doi          = {10.21437/INTERSPEECH.2005-853},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/WanC05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/mlmi/HainBDMGKLMWOR05,
  author       = {Thomas Hain and
                  Luk{\'{a}}s Burget and
                  John Dines and
                  Iain McCowan and
                  Giulia Garau and
                  Martin Karafi{\'{a}}t and
                  Mike Lincoln and
                  Darren Moore and
                  Vincent Wan and
                  Roeland Ordelman and
                  Steve Renals},
  editor       = {Steve Renals and
                  Samy Bengio},
  title        = {The Development of the {AMI} System for the Transcription of Speech
                  in Meetings},
  booktitle    = {Machine Learning for Multimodal Interaction, Second International
                  Workshop, {MLMI} 2005, Edinburgh, UK, July 11-13, 2005, Revised Selected
                  Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {3869},
  pages        = {344--356},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/11677482_30},
  doi          = {10.1007/11677482_30},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/mlmi/HainBDMGKLMWOR05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mlmi/HainBDGKLMMWOR05,
  author       = {Thomas Hain and
                  Luk{\'{a}}s Burget and
                  John Dines and
                  Giulia Garau and
                  Martin Karafi{\'{a}}t and
                  Mike Lincoln and
                  Iain McCowan and
                  Darren Moore and
                  Vincent Wan and
                  Roeland Ordelman and
                  Steve Renals},
  editor       = {Steve Renals and
                  Samy Bengio},
  title        = {The 2005 {AMI} System for the Transcription of Speech in Meetings},
  booktitle    = {Machine Learning for Multimodal Interaction, Second International
                  Workshop, {MLMI} 2005, Edinburgh, UK, July 11-13, 2005, Revised Selected
                  Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {3869},
  pages        = {450--462},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/11677482_38},
  doi          = {10.1007/11677482_38},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/mlmi/HainBDGKLMMWOR05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@phdthesis{DBLP:phd/ethos/Wan03,
  author       = {Wan, Vincent},
  title        = {Speaker verification using support vector machines},
  school       = {University of Sheffield, {UK}},
  year         = {2003},
  url          = {https://ethos.bl.uk/OrderDetails.do?uin=uk.bl.ethos.398619},
  timestamp    = {Tue, 05 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/phd/ethos/Wan03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/WanR03,
  author       = {Wan, Vincent and Renals, Steve},
  title        = {{SVMSVM:} support vector machine speaker verification methodology},
  booktitle    = {2003 {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} '03, Hong Kong, April 6-10, 2003},
  pages        = {221--224},
  publisher    = {{IEEE}},
  year         = {2003},
  url          = {https://doi.org/10.1109/ICASSP.2003.1202334},
  doi          = {10.1109/ICASSP.2003.1202334},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/WanR03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/WrigleyBWR03,
  author       = {Wrigley, Stuart N. and Brown, Guy J. and Wan, Vincent and Renals, Steve},
  title        = {Feature selection for the classification of crosstalk in multi-channel audio},
  booktitle    = {8th European Conference on Speech Communication and Technology, {EUROSPEECH} 2003 - {INTERSPEECH} 2003, Geneva, Switzerland, September 1-4, 2003},
  pages        = {469--472},
  publisher    = {{ISCA}},
  year         = {2003},
  url          = {https://doi.org/10.21437/Eurospeech.2003-172},
  doi          = {10.21437/EUROSPEECH.2003-172},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/WrigleyBWR03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/WanR02,
  author       = {Wan, Vincent and Renals, Steve},
  title        = {Evaluation of kernel methods for speaker verification and identification},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2002, May 13-17 2002, Orlando, Florida, {USA}},
  pages        = {669--672},
  publisher    = {{IEEE}},
  year         = {2002},
  url          = {https://doi.org/10.1109/ICASSP.2002.5743806},
  doi          = {10.1109/ICASSP.2002.5743806},
  timestamp    = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/WanR02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/mima/BratmanHWM92,
  author       = {Bratman, Michael E. and Harvey, Brian and Wan, Vincent and ter Meulen, Alice},
  title        = {Book reviews},
  journal      = {Minds Mach.},
  volume       = {2},
  number       = {2},
  pages        = {203--215},
  year         = {1992},
  url          = {https://doi.org/10.1007/BF00704458},
  doi          = {10.1007/BF00704458},
  timestamp    = {Mon, 11 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/mima/BratmanHWM92.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics