default search action

combined dblp search
author search
venue search
publication search

ask others

BibTeX records: Yoshihiko Nankaku

Name: dblp XML data dump
Creator: Schloss Dagstuhl - Leibniz Center for Informatics
Published: 1993
License: https://creativecommons.org/publicdomain/zero/1.0/
Keywords: dblp, XML, computer science, scholarly publications, metadata

> Home > Persons > Yoshihiko Nankaku

download as .bib file

% {V2Coder} is braced so sentence-casing styles keep its inner capital.
@article{DBLP:journals/access/FujimotoHNT25,
  author       = {Takato Fujimoto and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {{V2Coder}: {A} Non-Autoregressive Vocoder Based on Hierarchical Variational
                  Autoencoders},
  journal      = {{IEEE} Access},
  volume       = {13},
  pages        = {92833--92847},
  year         = {2025},
  url          = {https://doi.org/10.1109/ACCESS.2025.3572904},
  doi          = {10.1109/ACCESS.2025.3572904},
  timestamp    = {Sun, 06 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/access/FujimotoHNT25.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Same authors and title as DBLP:journals/corr/abs-2402-14692 (the CoRR record).
% {PeriodGrad} is braced so sentence-casing styles keep its inner capital.
@inproceedings{DBLP:conf/icassp/HonoHNT24,
  author       = {Yukiya Hono and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {{PeriodGrad}: Towards Pitch-Controllable Neural Vocoder Based on a Diffusion
                  Probabilistic Model},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2024, Seoul, Republic of Korea, April 14-19, 2024},
  pages        = {12782--12786},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/ICASSP48485.2024.10448502},
  doi          = {10.1109/ICASSP48485.2024.10448502},
  timestamp    = {Sun, 19 Jan 2025 13:18:23 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/HonoHNT24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Same authors and title as DBLP:conf/icassp/HonoHNT24 (the ICASSP 2024 record).
% {PeriodGrad} is braced so sentence-casing styles keep its inner capital.
@article{DBLP:journals/corr/abs-2402-14692,
  author       = {Yukiya Hono and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {{PeriodGrad}: Towards Pitch-Controllable Neural Vocoder Based on a Diffusion
                  Probabilistic Model},
  journal      = {CoRR},
  volume       = {abs/2402.14692},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.14692},
  doi          = {10.48550/ARXIV.2402.14692},
  eprinttype   = {arXiv},
  eprint       = {2402.14692},
  timestamp    = {Fri, 22 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-14692.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Same authors and title as DBLP:journals/corr/abs-2212-13703 (the CoRR record).
% booktitle punctuation follows the other ICASSP records in this file
% (comma between the conference name and the {ICASSP} acronym).
@inproceedings{DBLP:conf/icassp/HonoHNT23,
  author       = {Yukiya Hono and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Singing Voice Synthesis Based on a Musical Note Position-Aware Attention
                  Mechanism},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/ICASSP49357.2023.10095919},
  doi          = {10.1109/ICASSP49357.2023.10095919},
  timestamp    = {Sun, 19 Jan 2025 13:18:24 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/HonoHNT23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Same authors as DBLP:journals/corr/abs-2211-11222; titles differ only in capitalisation.
% booktitle punctuation follows the other ICASSP records in this file
% (comma between the conference name and the {ICASSP} acronym).
@inproceedings{DBLP:conf/icassp/YoshimuraTNOHHNT23,
  author       = {Takenori Yoshimura and
                  Shinji Takaki and
                  Kazuhiro Nakamura and
                  Keiichiro Oura and
                  Yukiya Hono and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Embedding a Differentiable Mel-Cepstral Synthesis Filter to a Neural
                  Speech Synthesis System},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/ICASSP49357.2023.10094872},
  doi          = {10.1109/ICASSP49357.2023.10094872},
  timestamp    = {Sun, 05 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/YoshimuraTNOHHNT23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% CoRR (arXiv) record; identifiers are grouped after the bibliographic fields.
@article{DBLP:journals/corr/abs-2301-02262,
  author     = {Miku Nishihara and
                Yukiya Hono and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Singing voice synthesis based on frame-level sequence-to-sequence
                models considering vocal timing deviation},
  journal    = {CoRR},
  volume     = {abs/2301.02262},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2301.02262},
  doi        = {10.48550/ARXIV.2301.02262},
  url        = {https://doi.org/10.48550/arXiv.2301.02262},
  timestamp  = {Tue, 10 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-02262.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% GCCE 2022 conference record.
@inproceedings{DBLP:conf/gcce/NakamuraHSTNK22,
  author     = {Yasutaka Nakamura and
                Seiichi Harata and
                Takuto Sakuma and
                Yoshihiro Tanaka and
                Yoshihiko Nankaku and
                Shohei Kato},
  title      = {Enhancing Social Telepresence on Text Communication Using Robot Avatar
                that Reflects User's Chatting States},
  booktitle  = {11th {IEEE} Global Conference on Consumer Electronics, {GCCE} 2022,
                Osaka, Japan, October 18-21, 2022},
  pages      = {707--709},
  publisher  = {{IEEE}},
  year       = {2022},
  doi        = {10.1109/GCCE56475.2022.10014193},
  url        = {https://doi.org/10.1109/GCCE56475.2022.10014193},
  timestamp  = {Tue, 07 May 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/gcce/NakamuraHSTNK22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% {Semi-Markov} is braced so sentence-casing styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/icassp/FujimotoHNT22,
  author       = {Takato Fujimoto and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Autoregressive Variational Autoencoder with a Hidden {Semi-Markov} Model-Based
                  Structured Attention for Speech Synthesis},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages        = {7462--7466},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/ICASSP43922.2022.9746158},
  doi          = {10.1109/ICASSP43922.2022.9746158},
  timestamp    = {Tue, 07 Jun 2022 17:34:47 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/FujimotoHNT22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Same authors and title as DBLP:journals/corr/abs-2206-12040 (the CoRR record).
@inproceedings{DBLP:conf/interspeech/MitsuiZSHNT22,
  author     = {Kentaro Mitsui and
                Tianyu Zhao and
                Kei Sawada and
                Yukiya Hono and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  editor     = {Hanseok Ko and
                John H. L. Hansen},
  title      = {End-to-End Text-to-Speech Based on Latent Representation of Speaking
                Styles Using Spontaneous Dialogue},
  booktitle  = {23rd Annual Conference of the International Speech Communication Association,
                Interspeech 2022, Incheon, Korea, September 18-22, 2022},
  pages      = {2328--2332},
  publisher  = {{ISCA}},
  year       = {2022},
  doi        = {10.21437/INTERSPEECH.2022-259},
  url        = {https://doi.org/10.21437/Interspeech.2022-259},
  timestamp  = {Tue, 17 Jun 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/MitsuiZSHNT22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% Same authors and title as DBLP:conf/interspeech/MitsuiZSHNT22 (the Interspeech 2022 record).
@article{DBLP:journals/corr/abs-2206-12040,
  author     = {Kentaro Mitsui and
                Tianyu Zhao and
                Kei Sawada and
                Yukiya Hono and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {End-to-End Text-to-Speech Based on Latent Representation of Speaking
                Styles Using Spontaneous Dialogue},
  journal    = {CoRR},
  volume     = {abs/2206.12040},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2206.12040},
  doi        = {10.48550/ARXIV.2206.12040},
  url        = {https://doi.org/10.48550/arXiv.2206.12040},
  timestamp  = {Tue, 17 Jun 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-12040.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% Same authors as DBLP:conf/icassp/YoshimuraTNOHHNT23; titles differ only in capitalisation.
@article{DBLP:journals/corr/abs-2211-11222,
  author     = {Takenori Yoshimura and
                Shinji Takaki and
                Kazuhiro Nakamura and
                Keiichiro Oura and
                Yukiya Hono and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Embedding a Differentiable Mel-cepstral Synthesis Filter to a Neural
                Speech Synthesis System},
  journal    = {CoRR},
  volume     = {abs/2211.11222},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2211.11222},
  doi        = {10.48550/ARXIV.2211.11222},
  url        = {https://doi.org/10.48550/arXiv.2211.11222},
  timestamp  = {Thu, 24 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-11222.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% Same authors and title as DBLP:conf/icassp/HonoHNT23 (the ICASSP 2023 record).
@article{DBLP:journals/corr/abs-2212-13703,
  author     = {Yukiya Hono and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Singing Voice Synthesis Based on a Musical Note Position-Aware Attention
                Mechanism},
  journal    = {CoRR},
  volume     = {abs/2212.13703},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2212.13703},
  doi        = {10.48550/ARXIV.2212.13703},
  url        = {https://doi.org/10.48550/arXiv.2212.13703},
  timestamp  = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-13703.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% {PeriodNet} is braced so sentence-casing styles keep its inner capital.
@article{DBLP:journals/access/HonoTHONT21,
  author       = {Yukiya Hono and
                  Shinji Takaki and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {{PeriodNet}: {A} Non-Autoregressive Raw Waveform Generative Model With
                  a Structure Separating Periodic and Aperiodic Components},
  journal      = {{IEEE} Access},
  volume       = {9},
  pages        = {137599--137612},
  year         = {2021},
  url          = {https://doi.org/10.1109/ACCESS.2021.3118033},
  doi          = {10.1109/ACCESS.2021.3118033},
  timestamp    = {Wed, 03 Nov 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/access/HonoTHONT21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Same authors and title as DBLP:journals/corr/abs-2108-02776 (the CoRR record).
@article{DBLP:journals/taslp/HonoHONT21,
  author     = {Yukiya Hono and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Sinsy: {A} Deep Neural Network-Based Singing Voice Synthesis System},
  journal    = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume     = {29},
  pages      = {2803--2815},
  year       = {2021},
  doi        = {10.1109/TASLP.2021.3104165},
  url        = {https://doi.org/10.1109/TASLP.2021.3104165},
  timestamp  = {Sun, 19 Jan 2025 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/taslp/HonoHONT21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% Same authors as DBLP:journals/corr/abs-2102-07786; titles differ only in capitalisation.
% The model name is spelled "PeriodNet" (as in the sibling records) and braced
% so sentence-casing styles keep its inner capital.
@inproceedings{DBLP:conf/icassp/HonoTHONT21,
  author       = {Yukiya Hono and
                  Shinji Takaki and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {{PeriodNet}: {A} Non-Autoregressive Waveform Generation Model with a
                  Structure Separating Periodic and Aperiodic Components},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages        = {6049--6053},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICASSP39728.2021.9414401},
  doi          = {10.1109/ICASSP39728.2021.9414401},
  timestamp    = {Fri, 09 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/HonoTHONT21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Same authors as DBLP:conf/icassp/HonoTHONT21; titles differ only in capitalisation.
% {PeriodNet} is braced so sentence-casing styles keep its inner capital.
@article{DBLP:journals/corr/abs-2102-07786,
  author       = {Yukiya Hono and
                  Shinji Takaki and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {{PeriodNet}: {A} non-autoregressive waveform generation model with a
                  structure separating periodic and aperiodic components},
  journal      = {CoRR},
  volume       = {abs/2102.07786},
  year         = {2021},
  url          = {https://arxiv.org/abs/2102.07786},
  eprinttype   = {arXiv},
  eprint       = {2102.07786},
  timestamp    = {Fri, 19 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2102-07786.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Same authors and title as DBLP:journals/taslp/HonoHONT21 (the journal record).
@article{DBLP:journals/corr/abs-2108-02776,
  author     = {Yukiya Hono and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Sinsy: {A} Deep Neural Network-Based Singing Voice Synthesis System},
  journal    = {CoRR},
  volume     = {abs/2108.02776},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2108.02776},
  url        = {https://arxiv.org/abs/2108.02776},
  timestamp  = {Wed, 11 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-02776.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% Same authors as DBLP:journals/corr/abs-1910-11690; titles differ only in capitalisation.
@inproceedings{DBLP:conf/icassp/NakamuraTHONT20,
  author     = {Kazuhiro Nakamura and
                Shinji Takaki and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Fast and High-Quality Singing Voice Synthesis System Based on Convolutional
                Neural Networks},
  booktitle  = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages      = {7239--7243},
  publisher  = {{IEEE}},
  year       = {2020},
  doi        = {10.1109/ICASSP40776.2020.9053811},
  url        = {https://doi.org/10.1109/ICASSP40776.2020.9053811},
  timestamp  = {Thu, 23 Jul 2020 16:19:28 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/NakamuraTHONT20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% ICASSP 2020 conference record.
@inproceedings{DBLP:conf/icassp/FujimotoTHONT20,
  author     = {Takato Fujimoto and
                Shinji Takaki and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Semi-Supervised Learning Based on Hierarchical Generative Models for
                End-to-End Speech Synthesis},
  booktitle  = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages      = {7644--7648},
  publisher  = {{IEEE}},
  year       = {2020},
  doi        = {10.1109/ICASSP40776.2020.9054466},
  url        = {https://doi.org/10.1109/ICASSP40776.2020.9054466},
  timestamp  = {Thu, 23 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/FujimotoTHONT20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% Same authors and title as DBLP:journals/corr/abs-2009-08474 (the CoRR record).
@inproceedings{DBLP:conf/interspeech/HonoTSHONT20,
  author     = {Yukiya Hono and
                Kazuna Tsuboi and
                Kei Sawada and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  editor     = {Helen Meng and
                Bo Xu and
                Thomas Fang Zheng},
  title      = {Hierarchical Multi-Grained Generative Model for Expressive Speech
                Synthesis},
  booktitle  = {21st Annual Conference of the International Speech Communication Association,
                Interspeech 2020, Virtual Event, Shanghai, China, October 25-29, 2020},
  pages      = {3441--3445},
  publisher  = {{ISCA}},
  year       = {2020},
  doi        = {10.21437/INTERSPEECH.2020-2477},
  url        = {https://doi.org/10.21437/Interspeech.2020-2477},
  timestamp  = {Sun, 19 Jan 2025 13:13:53 +0100},
  biburl     = {https://dblp.org/rec/conf/interspeech/HonoTSHONT20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% Same authors and title as DBLP:conf/interspeech/HonoTSHONT20 (the Interspeech 2020 record).
@article{DBLP:journals/corr/abs-2009-08474,
  author     = {Yukiya Hono and
                Kazuna Tsuboi and
                Kei Sawada and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Hierarchical Multi-Grained Generative Model for Expressive Speech
                Synthesis},
  journal    = {CoRR},
  volume     = {abs/2009.08474},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2009.08474},
  url        = {https://arxiv.org/abs/2009.08474},
  timestamp  = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-08474.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% ICASSP 2019 conference record.
@inproceedings{DBLP:conf/icassp/HonoHONT19,
  author     = {Yukiya Hono and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Singing Voice Synthesis Based on Generative Adversarial Networks},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages      = {6955--6959},
  publisher  = {{IEEE}},
  year       = {2019},
  doi        = {10.1109/ICASSP.2019.8683154},
  url        = {https://doi.org/10.1109/ICASSP.2019.8683154},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/HonoHONT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% {WaveNet} and the acronym {ADPCM} are restored to their proper capitalisation and
% braced so sentence-casing styles keep them.
@inproceedings{DBLP:conf/icassp/YoshimuraHONT19,
  author       = {Takenori Yoshimura and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Speaker-dependent {WaveNet}-based Delay-free {ADPCM} Speech Coding},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages        = {7145--7149},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICASSP.2019.8682264},
  doi          = {10.1109/ICASSP.2019.8682264},
  timestamp    = {Sun, 30 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/YoshimuraHONT19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% SSW 2019 workshop record.
@inproceedings{DBLP:conf/ssw/OuraNHNT19,
  author     = {Keiichiro Oura and
                Kazuhiro Nakamura and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  editor     = {Michael Pucher},
  title      = {Deep neural network based real-time speech vocoder with periodic and
                aperiodic inputs},
  booktitle  = {10th {ISCA} Speech Synthesis Workshop, {SSW} 2019, Vienna, Austria,
                September 20-22, 2019},
  pages      = {13--18},
  publisher  = {{ISCA}},
  year       = {2019},
  doi        = {10.21437/SSW.2019-3},
  url        = {https://doi.org/10.21437/SSW.2019-3},
  timestamp  = {Wed, 31 Jul 2024 13:04:37 +0200},
  biburl     = {https://dblp.org/rec/conf/ssw/OuraNHNT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% {Japanese} is braced so sentence-casing styles keep the proper adjective capitalised.
@inproceedings{DBLP:conf/ssw/FujimotoHONT19,
  author       = {Takato Fujimoto and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  editor       = {Michael Pucher},
  title        = {Impacts of input linguistic feature representation on {Japanese} end-to-end
                  speech synthesis},
  booktitle    = {10th {ISCA} Speech Synthesis Workshop, {SSW} 2019, Vienna, Austria,
                  September 20-22, 2019},
  pages        = {166--171},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/SSW.2019-30},
  doi          = {10.21437/SSW.2019-30},
  timestamp    = {Wed, 31 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ssw/FujimotoHONT19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {semi-Markov} is braced so sentence-casing styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/ssw/ShimadaHONT19,
  author       = {Motoki Shimada and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  editor       = {Michael Pucher},
  title        = {Low computational cost speech synthesis based on deep neural networks
                  using hidden {semi-Markov} model structures},
  booktitle    = {10th {ISCA} Speech Synthesis Workshop, {SSW} 2019, Vienna, Austria,
                  September 20-22, 2019},
  pages        = {177--182},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/SSW.2019-32},
  doi          = {10.21437/SSW.2019-32},
  timestamp    = {Wed, 31 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ssw/ShimadaHONT19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% url uses the https scheme, matching the other arXiv records in this file.
@article{DBLP:journals/corr/abs-1904-06868,
  author       = {Kazuhiro Nakamura and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Singing voice synthesis based on convolutional neural networks},
  journal      = {CoRR},
  volume       = {abs/1904.06868},
  year         = {2019},
  url          = {https://arxiv.org/abs/1904.06868},
  eprinttype   = {arXiv},
  eprint       = {1904.06868},
  timestamp    = {Sat, 27 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-06868.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Same authors as DBLP:conf/icassp/NakamuraTHONT20; titles differ only in capitalisation.
% url uses the https scheme, matching the other arXiv records in this file.
@article{DBLP:journals/corr/abs-1910-11690,
  author       = {Kazuhiro Nakamura and
                  Shinji Takaki and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Fast and High-Quality Singing Voice Synthesis System based on Convolutional
                  Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1910.11690},
  year         = {2019},
  url          = {https://arxiv.org/abs/1910.11690},
  eprinttype   = {arXiv},
  eprint       = {1910.11690},
  timestamp    = {Thu, 31 Oct 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-11690.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article record (volume 26, number 7).
@article{DBLP:journals/taslp/YoshimuraHONT18,
  author     = {Takenori Yoshimura and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Mel-Cepstrum-Based Quantization Noise Shaping Applied to Neural-Network-Based
                Speech Waveform Synthesis},
  journal    = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume     = {26},
  number     = {7},
  pages      = {1173--1180},
  year       = {2018},
  doi        = {10.1109/TASLP.2018.2818408},
  url        = {https://doi.org/10.1109/TASLP.2018.2818408},
  timestamp  = {Sun, 19 Jan 2025 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/taslp/YoshimuraHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% {Markov} is braced so sentence-casing styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/apsipa/KasugaiTSHONT18,
  author       = {Takayuki Kasugai and
                  Yoshinari Tsuzuki and
                  Kei Sawada and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Image Recognition Based on Convolutional Neural Networks Using Features
                  Generated from Separable Lattice Hidden {Markov} Models},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA, November
                  12-15, 2018},
  pages        = {324--328},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.23919/APSIPA.2018.8659518},
  doi          = {10.23919/APSIPA.2018.8659518},
  timestamp    = {Wed, 16 Oct 2019 14:14:55 +0200},
  biburl       = {https://dblp.org/rec/conf/apsipa/KasugaiTSHONT18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {Semi-Markov} is braced so sentence-casing styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/apsipa/NakaoHONT18,
  author       = {Kento Nakao and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Speaker Adaptation for Speech Synthesis Based on Deep Neural Networks
                  Using Hidden {Semi-Markov} Model Structures},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA, November
                  12-15, 2018},
  pages        = {638--643},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.23919/APSIPA.2018.8659791},
  doi          = {10.23919/APSIPA.2018.8659791},
  timestamp    = {Sat, 09 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/NakaoHONT18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {WaveNet} is braced so sentence-casing styles keep its inner capital.
@inproceedings{DBLP:conf/apsipa/FujimotoYHONT18,
  author       = {Takato Fujimoto and
                  Takenori Yoshimura and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Speech Synthesis Using {WaveNet} Vocoder Based on Periodic/Aperiodic
                  Decomposition},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA, November
                  12-15, 2018},
  pages        = {644--648},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.23919/APSIPA.2018.8659541},
  doi          = {10.23919/APSIPA.2018.8659541},
  timestamp    = {Sat, 09 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/FujimotoYHONT18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% The acronym {DNN} and the system name {Sinsy} are braced so sentence-casing
% styles keep their capitalisation.
@inproceedings{DBLP:conf/apsipa/HonoMNHONT18,
  author       = {Yukiya Hono and
                  Shumma Murata and
                  Kazuhiro Nakamura and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Recent Development of the {DNN}-based Singing Voice Synthesis System
                  - {Sinsy}},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA, November
                  12-15, 2018},
  pages        = {1003--1009},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.23919/APSIPA.2018.8659797},
  doi          = {10.23919/APSIPA.2018.8659797},
  timestamp    = {Sat, 09 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/apsipa/HonoMNHONT18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% APSIPA ASC 2018 conference record.
@inproceedings{DBLP:conf/apsipa/YoshimuraKHONT18,
  author     = {Takenori Yoshimura and
                Natsumi Koike and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Discriminative Feature Extraction Based on Sequential Variational
                Autoencoder for Speaker Recognition},
  booktitle  = {Asia-Pacific Signal and Information Processing Association Annual
                Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA, November
                12-15, 2018},
  pages      = {1742--1746},
  publisher  = {{IEEE}},
  year       = {2018},
  doi        = {10.23919/APSIPA.2018.8659722},
  url        = {https://doi.org/10.23919/APSIPA.2018.8659722},
  timestamp  = {Sat, 09 Mar 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/apsipa/YoshimuraKHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% APSIPA ASC 2018 conference record.
@inproceedings{DBLP:conf/apsipa/SendaHSHONT18,
  author     = {Koki Senda and
                Yukiya Hono and
                Kei Sawada and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Singing Voice Conversion Using Posted Waveform Data on Music Social
                Media},
  booktitle  = {Asia-Pacific Signal and Information Processing Association Annual
                Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA, November
                12-15, 2018},
  pages      = {1913--1917},
  publisher  = {{IEEE}},
  year       = {2018},
  doi        = {10.23919/APSIPA.2018.8659568},
  url        = {https://doi.org/10.23919/APSIPA.2018.8659568},
  timestamp  = {Sat, 09 Mar 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/apsipa/SendaHSHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/blizzard/SawadaYHONT18,
  author       = {Kei Sawada and
                  Takenori Yoshimura and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {The {NITech} text-to-speech system for the {Blizzard} {Challenge} 2018},
  booktitle    = {The Blizzard Challenge 2018, Hyderabad, India, September 8, 2018},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/Blizzard.2018-7},
  doi          = {10.21437/BLIZZARD.2018-7},
  timestamp    = {Fri, 20 Sep 2024 10:08:07 +0200},
  biburl       = {https://dblp.org/rec/conf/blizzard/SawadaYHONT18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/IchikawaSHNT18,
  author       = {Eiji Ichikawa and
                  Kei Sawada and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Image Recognition Based on Separable Lattice {HMMs} Using a Deep Neural
                  Network for Output Probability Distributions},
  booktitle    = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages        = {3021--3025},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ICASSP.2018.8461784},
  doi          = {10.1109/ICASSP.2018.8461784},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/IchikawaSHNT18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/NiwaYHONT18,
  author       = {Jumpei Niwa and
                  Takenori Yoshimura and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Statistical Voice Conversion Based on {WaveNet}},
  booktitle    = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages        = {5289--5293},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ICASSP.2018.8461948},
  doi          = {10.1109/ICASSP.2018.8461948},
  timestamp    = {Tue, 18 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/NiwaYHONT18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/slt/YoshimuraHONT18,
  author       = {Takenori Yoshimura and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {{WaveNet}-Based Zero-Delay Lossless Speech Coding},
  booktitle    = {2018 {IEEE} Spoken Language Technology Workshop, {SLT} 2018, Athens,
                  Greece, December 18-21, 2018},
  pages        = {153--158},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/SLT.2018.8639598},
  doi          = {10.1109/SLT.2018.8639598},
  timestamp    = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl       = {https://dblp.org/rec/conf/slt/YoshimuraHONT18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/taslp/YoshimuraHONT17,
  author       = {Takenori Yoshimura and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Simultaneous Optimization of Multiple Tree-Based Factor Analyzed {HMM}
                  for Speech Synthesis},
  journal      = {{IEEE/ACM} Trans. Audio Speech Lang. Process.},
  volume       = {25},
  number       = {9},
  pages        = {1836--1845},
  year         = {2017},
  url          = {https://doi.org/10.1109/TASLP.2017.2721219},
  doi          = {10.1109/TASLP.2017.2721219},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/YoshimuraHONT17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/TsuzukiSHNT17,
  author       = {Yoshinari Tsuzuki and
                  Kei Sawada and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Image recognition based on discriminative models using features generated
                  from separable lattice {HMMs}},
  booktitle    = {2017 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2017, New Orleans, LA, USA, March 5-9, 2017},
  pages        = {2607--2611},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/ICASSP.2017.7952628},
  doi          = {10.1109/ICASSP.2017.7952628},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/TsuzukiSHNT17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/GullyYMHNT17,
  author       = {Gully, Amelia Jane and
                  Yoshimura, Takenori and
                  Murphy, Damian T. and
                  Hashimoto, Kei and
                  Nankaku, Yoshihiko and
                  Tokuda, Keiichi},
  editor       = {Lacerda, Francisco},
  title        = {Articulatory Text-to-Speech Synthesis Using the Digital Waveguide
                  Mesh Driven by a Deep Neural Network},
  booktitle    = {18th Annual Conference of the International Speech Communication Association,
                  Interspeech 2017, Stockholm, Sweden, August 20-24, 2017},
  pages        = {234--238},
  publisher    = {{ISCA}},
  year         = {2017},
  url          = {https://doi.org/10.21437/Interspeech.2017-900},
  doi          = {10.21437/INTERSPEECH.2017-900},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/GullyYMHNT17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@incollection{DBLP:books/sp/17/TokudaLNOHYTUTRY17,
  author       = {Keiichi Tokuda and
                  Akinobu Lee and
                  Yoshihiko Nankaku and
                  Keiichiro Oura and
                  Kei Hashimoto and
                  Daisuke Yamamoto and
                  Ichi Takumi and
                  Takahiro Uchiya and
                  Shuhei Tsutsumi and
                  Steve Renals and
                  Junichi Yamagishi},
  editor       = {Toyoaki Nishida},
  title        = {User Generated Dialogue Systems: {uDialogue}},
  booktitle    = {Human-Harmonized Information Technology, Volume 2, Horizontal Expansion},
  pages        = {77--114},
  publisher    = {Springer},
  year         = {2017},
  url          = {https://doi.org/10.1007/978-4-431-56535-2\_3},
  doi          = {10.1007/978-4-431-56535-2\_3},
  timestamp    = {Wed, 12 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/books/sp/17/TokudaLNOHYTUTRY17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ieicet/SawadaTHNT16,
  author       = {Kei Sawada and
                  Akira Tamamori and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {A {Bayesian} Approach to Image Recognition Based on Separable Lattice
                  Hidden {Markov} Models},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {99-D},
  number       = {12},
  pages        = {3119--3131},
  year         = {2016},
  url          = {https://doi.org/10.1587/transinf.2016EDP7112},
  doi          = {10.1587/TRANSINF.2016EDP7112},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/SawadaTHNT16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/HashimotoONT16,
  author       = {Hashimoto, Kei and
                  Oura, Keiichiro and
                  Nankaku, Yoshihiko and
                  Tokuda, Keiichi},
  title        = {Trajectory training considering global variance for speech synthesis
                  based on neural networks},
  booktitle    = {2016 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2016, Shanghai, China, March 20-25, 2016},
  pages        = {5600--5604},
  publisher    = {{IEEE}},
  year         = {2016},
  url          = {https://doi.org/10.1109/ICASSP.2016.7472749},
  doi          = {10.1109/ICASSP.2016.7472749},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/HashimotoONT16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/HosakaHONT16,
  author       = {Hosaka, Naoki and
                  Hashimoto, Kei and
                  Oura, Keiichiro and
                  Nankaku, Yoshihiko and
                  Tokuda, Keiichi},
  editor       = {Morgan, Nelson},
  title        = {Voice Conversion Based on Trajectory Model Training of Neural Networks
                  Considering Global Variance},
  booktitle    = {17th Annual Conference of the International Speech Communication Association,
                  Interspeech 2016, San Francisco, CA, USA, September 8-12, 2016},
  pages        = {307--311},
  publisher    = {{ISCA}},
  year         = {2016},
  url          = {https://doi.org/10.21437/Interspeech.2016-1035},
  doi          = {10.21437/INTERSPEECH.2016-1035},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HosakaHONT16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/NishimuraHONT16,
  author       = {Nishimura, Masanari and
                  Hashimoto, Kei and
                  Oura, Keiichiro and
                  Nankaku, Yoshihiko and
                  Tokuda, Keiichi},
  editor       = {Morgan, Nelson},
  title        = {Singing Voice Synthesis Based on Deep Neural Networks},
  booktitle    = {17th Annual Conference of the International Speech Communication Association,
                  Interspeech 2016, San Francisco, CA, USA, September 8-12, 2016},
  pages        = {2478--2482},
  publisher    = {{ISCA}},
  year         = {2016},
  url          = {https://doi.org/10.21437/Interspeech.2016-1027},
  doi          = {10.21437/INTERSPEECH.2016-1027},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/NishimuraHONT16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/DallHONT16,
  author       = {Dall, Rasmus and
                  Hashimoto, Kei and
                  Oura, Keiichiro and
                  Nankaku, Yoshihiko and
                  Tokuda, Keiichi},
  editor       = {Morgan, Nelson},
  title        = {Redefining the Linguistic Context Feature Set for {HMM} and {DNN}
                  {TTS} Through Position and Parsing},
  booktitle    = {17th Annual Conference of the International Speech Communication Association,
                  Interspeech 2016, San Francisco, CA, USA, September 8-12, 2016},
  pages        = {2851--2855},
  publisher    = {{ISCA}},
  year         = {2016},
  url          = {https://doi.org/10.21437/Interspeech.2016-399},
  doi          = {10.21437/INTERSPEECH.2016-399},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/DallHONT16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ssw/TokudaHON16,
  author       = {Tokuda, Keiichi and
                  Hashimoto, Kei and
                  Oura, Keiichiro and
                  Nankaku, Yoshihiko},
  editor       = {Black, Alan W.},
  title        = {Temporal modeling in neural network based statistical parametric speech
                  synthesis},
  booktitle    = {The 9th {ISCA} Speech Synthesis Workshop, {SSW} 2016, Sunnyvale, CA,
                  USA, September 13-15, 2016},
  pages        = {106--111},
  publisher    = {{ISCA}},
  year         = {2016},
  url          = {https://doi.org/10.21437/SSW.2016-18},
  doi          = {10.21437/SSW.2016-18},
  timestamp    = {Wed, 31 Jul 2024 11:28:11 +0200},
  biburl       = {https://dblp.org/rec/conf/ssw/TokudaHON16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/HashimotoONT15,
  author       = {Hashimoto, Kei and
                  Oura, Keiichiro and
                  Nankaku, Yoshihiko and
                  Tokuda, Keiichi},
  title        = {The effect of neural networks in statistical parametric speech synthesis},
  booktitle    = {2015 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2015, South Brisbane, Queensland, Australia,
                  April 19-24, 2015},
  pages        = {4455--4459},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/ICASSP.2015.7178813},
  doi          = {10.1109/ICASSP.2015.7178813},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/HashimotoONT15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/YoshimuraHNT15,
  author       = {Takenori Yoshimura and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Simultaneous optimization of multiple tree structures for factor analyzed
                  {HMM}-based speech synthesis},
  booktitle    = {16th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages        = {1196--1200},
  publisher    = {{ISCA}},
  year         = {2015},
  url          = {https://doi.org/10.21437/Interspeech.2015-303},
  doi          = {10.21437/INTERSPEECH.2015-303},
  timestamp    = {Sun, 19 Jan 2025 13:13:53 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/YoshimuraHNT15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/GangireddyRNL15,
  author       = {Gangireddy, Siva Reddy and
                  Renals, Steve and
                  Nankaku, Yoshihiko and
                  Lee, Akinobu},
  title        = {Prosodically-enhanced recurrent neural network language models},
  booktitle    = {16th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages        = {2390--2394},
  publisher    = {{ISCA}},
  year         = {2015},
  url          = {https://doi.org/10.21437/Interspeech.2015-517},
  doi          = {10.21437/INTERSPEECH.2015-517},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/GangireddyRNL15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ieicet/NakamuraHNT14,
  author       = {Kazuhiro Nakamura and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Integration of Spectral Feature Extraction and Modeling for {HMM}-Based
                  Speech Synthesis},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {97-D},
  number       = {6},
  pages        = {1438--1448},
  year         = {2014},
  url          = {https://doi.org/10.1587/transinf.E97.D.1438},
  doi          = {10.1587/TRANSINF.E97.D.1438},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/NakamuraHNT14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ieicet/TamamoriNT14,
  author       = {Akira Tamamori and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Image Recognition Based on Separable Lattice Trajectory {2-D} {HMMs}},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {97-D},
  number       = {7},
  pages        = {1842--1854},
  year         = {2014},
  url          = {https://doi.org/10.1587/transinf.E97.D.1842},
  doi          = {10.1587/TRANSINF.E97.D.1842},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/TamamoriNT14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/jstsp/TakakiNT14,
  author       = {Shinji Takaki and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Contextual Additive Structure for {HMM}-Based Speech Synthesis},
  journal      = {{IEEE} J. Sel. Top. Signal Process.},
  volume       = {8},
  number       = {2},
  pages        = {229--238},
  year         = {2014},
  url          = {https://doi.org/10.1109/JSTSP.2014.2305919},
  doi          = {10.1109/JSTSP.2014.2305919},
  timestamp    = {Thu, 09 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jstsp/TakakiNT14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/NakamuraONT14,
  author       = {Kazuhiro Nakamura and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {{HMM}-Based singing voice synthesis and its application to {Japanese}
                  and {English}},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages        = {265--269},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/ICASSP.2014.6853599},
  doi          = {10.1109/ICASSP.2014.6853599},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/NakamuraONT14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/ShirotaNHONT14,
  author       = {Kanako Shirota and
                  Kazuhiro Nakamura and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Integration of speaker and pitch adaptive training for {HMM}-based singing
                  voice synthesis},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages        = {2559--2563},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/ICASSP.2014.6854062},
  doi          = {10.1109/ICASSP.2014.6854062},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ShirotaNHONT14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/NakamuraHONT14,
  author       = {Nakamura, Kazuhiro and
                  Hashimoto, Kei and
                  Oura, Keiichiro and
                  Nankaku, Yoshihiko and
                  Tokuda, Keiichi},
  editor       = {Li, Haizhou and
                  Meng, Helen M. and
                  Ma, Bin and
                  Chng, Engsiong and
                  Xie, Lei},
  title        = {A mel-cepstral analysis technique restoring high frequency components
                  from low-sampling-rate speech},
  booktitle    = {15th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2014, Singapore, September 14-18, 2014},
  pages        = {2494--2498},
  publisher    = {{ISCA}},
  year         = {2014},
  url          = {https://doi.org/10.21437/Interspeech.2014-535},
  doi          = {10.21437/INTERSPEECH.2014-535},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/NakamuraHONT14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ieicet/ShiotaHNT13,
  author       = {Sayaka Shiota and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {A {Bayesian} Framework Using Multiple Model Structures for Speech Recognition},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {96-D},
  number       = {4},
  pages        = {939--948},
  year         = {2013},
  url          = {https://doi.org/10.1587/transinf.E96.D.939},
  doi          = {10.1587/TRANSINF.E96.D.939},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/ShiotaHNT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/pieee/TokudaNTZYO13,
  author       = {Keiichi Tokuda and
                  Yoshihiko Nankaku and
                  Tomoki Toda and
                  Heiga Zen and
                  Junichi Yamagishi and
                  Keiichiro Oura},
  title        = {Speech Synthesis Based on Hidden {Markov} Models},
  journal      = {Proc. {IEEE}},
  volume       = {101},
  number       = {5},
  pages        = {1234--1252},
  year         = {2013},
  url          = {https://doi.org/10.1109/JPROC.2013.2251852},
  doi          = {10.1109/JPROC.2013.2251852},
  timestamp    = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pieee/TokudaNTZYO13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/apsipa/SawadaHNT13,
  author       = {Kei Sawada and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Image recognition based on hidden {Markov} eigen-image models using
                  variational {Bayesian} method},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual
                  Summit and Conference, {APSIPA} 2013, Kaohsiung, Taiwan, October 29
                  - November 1, 2013},
  pages        = {1--8},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/APSIPA.2013.6694382},
  doi          = {10.1109/APSIPA.2013.6694382},
  timestamp    = {Wed, 16 Oct 2019 14:14:55 +0200},
  biburl       = {https://dblp.org/rec/conf/apsipa/SawadaHNT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/MakinoTHNT13,
  author       = {Takaya Makino and
                  Shinji Takaki and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Separable lattice {2-D} {HMMs} introducing state duration control for
                  recognition of images with various variations},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages        = {3203--3207},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICASSP.2013.6638249},
  doi          = {10.1109/ICASSP.2013.6638249},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/MakinoTHNT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/TamamoriNT13,
  author       = {Akira Tamamori and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Image recognition based on separable lattice trajectory {2-D} {HMMs}},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages        = {3467--3471},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICASSP.2013.6638302},
  doi          = {10.1109/ICASSP.2013.6638302},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/TamamoriNT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/TakakiNT13,
  author       = {Shinji Takaki and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Contextual partial additive structure for {HMM}-based speech synthesis},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages        = {7878--7882},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICASSP.2013.6639198},
  doi          = {10.1109/ICASSP.2013.6639198},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/TakakiNT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/NakamuraHNT13,
  author       = {Kazuhiro Nakamura and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Integration of acoustic modeling and mel-cepstral analysis for {HMM}-based
                  speech synthesis},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages        = {7883--7887},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICASSP.2013.6639199},
  doi          = {10.1109/ICASSP.2013.6639199},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/NakamuraHNT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ssw/YoshimuraHONT13,
  author       = {Takenori Yoshimura and
                  Kei Hashimoto and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Cross-lingual speaker adaptation based on factor analysis using bilingual
                  speech data for {HMM}-based speech synthesis},
  booktitle    = {The Eighth {ISCA} Tutorial and Research Workshop on Speech Synthesis,
                  {SSW} 2013, Barcelona, Spain, August 31 - September 2, 2013},
  pages        = {297--302},
  publisher    = {{ISCA}},
  year         = {2013},
  url          = {https://www.isca-archive.org/ssw\_2013/yoshimura13\_ssw.html},
  timestamp    = {Fri, 02 Aug 2024 09:01:40 +0200},
  biburl       = {https://dblp.org/rec/conf/ssw/YoshimuraHONT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ieicet/TamamoriNT12,
  author       = {Akira Tamamori and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {An Extension of Separable Lattice {2-D} {HMMs} for Rotational Data Variations},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {95-D},
  number       = {8},
  pages        = {2074--2083},
  year         = {2012},
  url          = {https://doi.org/10.1587/transinf.E95.D.2074},
  doi          = {10.1587/TRANSINF.E95.D.2074},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/TamamoriNT12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/taslp/ZenGNT12,
  author       = {Heiga Zen and
                  Mark J. F. Gales and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Product of Experts for Statistical Parametric Speech Synthesis},
  journal      = {{IEEE} Trans. Audio Speech Lang. Process.},
  volume       = {20},
  number       = {3},
  pages        = {794--805},
  year         = {2012},
  url          = {https://doi.org/10.1109/TASL.2011.2165280},
  doi          = {10.1109/TASL.2011.2165280},
  timestamp    = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/ZenGNT12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/SawadaTHNT12,
  author       = {Kei Sawada and
                  Akira Tamamori and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Face recognition based on separable lattice {2-D} {HMMs} using variational
                  {Bayesian} method},
  booktitle    = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages        = {2205--2208},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICASSP.2012.6288351},
  doi          = {10.1109/ICASSP.2012.6288351},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/SawadaTHNT12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/KumakiNT12,
  author       = {Keisuke Kumaki and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Face recognition based on extended separable lattice {2-D} {HMMs}},
  booktitle    = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages        = {2209--2212},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICASSP.2012.6288352},
  doi          = {10.1109/ICASSP.2012.6288352},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/KumakiNT12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/ShiotaHNT12,
  author       = {Sayaka Shiota and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {A model structure integration based on a {Bayesian} framework for speech
                  recognition},
  booktitle    = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages        = {4813--4816},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICASSP.2012.6288996},
  doi          = {10.1109/ICASSP.2012.6288996},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ShiotaHNT12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/OuraMNT12,
  author       = {Keiichiro Oura and
                  Ayami Mase and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Pitch adaptive training for {HMM}-based singing voice synthesis},
  booktitle    = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages        = {5377--5380},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICASSP.2012.6289136},
  doi          = {10.1109/ICASSP.2012.6289136},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/OuraMNT12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/OliveiraSNT12,
  author       = {Viviane de Franca Oliveira and
                  Sayaka Shiota and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Cross-lingual Speaker Adaptation for {HMM}-based Speech Synthesis based
                  on Perceptual Characteristics and Speaker Interpolation},
  booktitle    = {13th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2012, Portland, Oregon, USA, September 9-13, 2012},
  pages        = {983--986},
  publisher    = {{ISCA}},
  year         = {2012},
  url          = {https://doi.org/10.21437/Interspeech.2012-292},
  doi          = {10.21437/INTERSPEECH.2012-292},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/OliveiraSNT12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/HattoriHNT12,
  author       = {Takafumi Hattori and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {A {Bayesian} Approach to Speaker Recognition Based on {GMMs} Using Multiple
                  Model Structures},
  booktitle    = {13th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2012, Portland, Oregon, USA, September 9-13, 2012},
  pages        = {1107--1110},
  publisher    = {{ISCA}},
  year         = {2012},
  url          = {https://doi.org/10.21437/Interspeech.2012-334},
  doi          = {10.21437/INTERSPEECH.2012-334},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HattoriHNT12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ieicet/HashimotoZNLT11,
  author       = {Kei Hashimoto and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Akinobu Lee and
                  Keiichi Tokuda},
  title        = {{Bayesian} Context Clustering Using Cross Validation for Speech Recognition},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {94-D},
  number       = {3},
  pages        = {668--678},
  year         = {2011},
  url          = {https://doi.org/10.1587/transinf.E94.D.668},
  doi          = {10.1587/TRANSINF.E94.D.668},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/HashimotoZNLT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal name corrected: DOI prefix 10.1109/TASL with vol. 19 (2011) is
% IEEE Transactions on Audio, Speech, and Language Processing.
@article{DBLP:journals/taslp/ZenNT11,
  author       = {Heiga Zen and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Continuous Stochastic Feature Mapping Based on Trajectory {HMMs}},
  journal      = {{IEEE} Trans. Audio Speech Lang. Process.},
  volume       = {19},
  number       = {2},
  pages        = {417--430},
  year         = {2011},
  url          = {https://doi.org/10.1109/TASL.2010.2049685},
  doi          = {10.1109/TASL.2010.2049685},
  timestamp    = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/ZenNT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/TakakiONT11,
  author       = {Shinji Takaki and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {An optimization algorithm of independent mean and variance parameter
                  tying structures for {HMM}-based speech synthesis},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress
                  Center, Prague, Czech Republic},
  pages        = {4700--4703},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ICASSP.2011.5947404},
  doi          = {10.1109/ICASSP.2011.5947404},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/TakakiONT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/PanNTT11,
  author       = {Shifeng Pan and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda and
                  Jianhua Tao},
  title        = {Global variance modeling on frequency domain delta {LSP} for {HMM}-based
                  speech synthesis},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress
                  Center, Prague, Czech Republic},
  pages        = {4716--4719},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ICASSP.2011.5947408},
  doi          = {10.1109/ICASSP.2011.5947408},
  timestamp    = {Mon, 18 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/PanNTT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/HashimotoNT11,
  author       = {Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Multi-Speaker Modeling with Shared Prior Distributions and Model Structures
                  for {Bayesian} Speech Synthesis},
  booktitle    = {12th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2011, Florence, Italy, August 27-31, 2011},
  pages        = {113--116},
  publisher    = {{ISCA}},
  year         = {2011},
  url          = {https://doi.org/10.21437/Interspeech.2011-29},
  doi          = {10.21437/INTERSPEECH.2011-29},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HashimotoNT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/LiNT11,
  author       = {Lei Li and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {A {Bayesian} Approach to Voice Conversion Based on {GMMs} Using Multiple
                  Model Structures},
  booktitle    = {12th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2011, Florence, Italy, August 27-31, 2011},
  pages        = {661--664},
  publisher    = {{ISCA}},
  year         = {2011},
  url          = {https://doi.org/10.21437/Interspeech.2011-270},
  doi          = {10.21437/INTERSPEECH.2011-270},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/LiNT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/RemesNT11,
  author       = {Ulpu Remes and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {{GMM}-Based Missing-Feature Reconstruction on Multi-Frame Windows},
  booktitle    = {12th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2011, Florence, Italy, August 27-31, 2011},
  pages        = {1665--1668},
  publisher    = {{ISCA}},
  year         = {2011},
  url          = {https://doi.org/10.21437/Interspeech.2011-214},
  doi          = {10.21437/INTERSPEECH.2011-214},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/RemesNT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/ChenNZTLD11,
  author       = {Ling{-}Hui Chen and
                  Yoshihiko Nankaku and
                  Heiga Zen and
                  Keiichi Tokuda and
                  Zhen{-}Hua Ling and
                  Li{-}Rong Dai},
  title        = {Estimation of Window Coefficients for Dynamic Feature Extraction for
                  {HMM}-Based Speech Synthesis},
  booktitle    = {12th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2011, Florence, Italy, August 27-31, 2011},
  pages        = {1801--1804},
  publisher    = {{ISCA}},
  year         = {2011},
  url          = {https://doi.org/10.21437/Interspeech.2011-33},
  doi          = {10.21437/INTERSPEECH.2011-33},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ChenNZTLD11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/ItoNL11,
  author       = {Ito, Naoaki and
                  Nankaku, Yoshihiko and
                  Lee, Akinobu},
  title        = {Evaluation of Tree-Trellis Based Decoding in
                  Over-Million {LVCSR}},
  booktitle    = {12th Annual Conference of the International Speech Communication
                  Association, {INTERSPEECH} 2011, Florence, Italy,
                  August 27-31, 2011},
  pages        = {1937--1940},
  publisher    = {{ISCA}},
  year         = {2011},
  url          = {https://doi.org/10.21437/Interspeech.2011-362},
  doi          = {10.21437/INTERSPEECH.2011-362},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ItoNL11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ieicet/OuraZNLT10,
  author       = {Keiichiro Oura and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Akinobu Lee and
                  Keiichi Tokuda},
  title        = {A Covariance-Tying Technique for {HMM}-Based Speech Synthesis},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {93-D},
  number       = {3},
  pages        = {595--601},
  year         = {2010},
  url          = {https://doi.org/10.1587/transinf.E93.D.595},
  doi          = {10.1587/TRANSINF.E93.D.595},
  timestamp    = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/OuraZNLT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/eamt/Martinez-GomezH10,
  author       = {Mart{\'{\i}}nez{-}G{\'{o}}mez, Pascual and
                  Hashimoto, Kei and
                  Nankaku, Yoshihiko and
                  Tokuda, Keiichi and
                  Sanchis{-}Trilles, Germ{\'{a}}n},
  editor       = {Yvon, Fran{\c{c}}ois and
                  Hansen, Viggo},
  title        = {A Deterministic Annealing-Based Training Algorithm For
                  Statistical Machine Translation Models},
  booktitle    = {Proceedings of the 14th Annual conference of the European
                  Association for Machine Translation, {EAMT} 2010,
                  Saint Rapha{\"{e}}l, France, May 27-28, 2010},
  publisher    = {European Association for Machine Translation},
  year         = {2010},
  url          = {https://aclanthology.org/2010.eamt-1.20/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eamt/Martinez-GomezH10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/TakahashiTNT10,
  author       = {Yoshiaki Takahashi and
                  Akira Tamamori and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Face recognition based on separable lattice {2-D} {HMM} with state duration
                  modeling},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {2162--2165},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495625},
  doi          = {10.1109/ICASSP.2010.5495625},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/TakahashiTNT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/TamamoriNT10,
  author       = {Akira Tamamori and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {An extension of Separable Lattice {2-D} {HMMs} for rotational data variations},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {2206--2209},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495735},
  doi          = {10.1109/ICASSP.2010.5495735},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/TamamoriNT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/KazumiNT10,
  author       = {Kyosuke Kazumi and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Factor analyzed voice models for {HMM}-based speech synthesis},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {4234--4237},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495689},
  doi          = {10.1109/ICASSP.2010.5495689},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/KazumiNT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/ZenGNT10,
  author       = {Zen, Heiga and
                  Gales, Mark J. F. and
                  Nankaku, Yoshihiko and
                  Tokuda, Keiichi},
  title        = {Statistical parametric speech synthesis based on
                  product of experts},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics,
                  Speech, and Signal Processing, {ICASSP} 2010, 14-19 March 2010,
                  Sheraton Dallas Hotel, Dallas, Texas, {USA}},
  pages        = {4242--4245},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495691},
  doi          = {10.1109/ICASSP.2010.5495691},
  timestamp    = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ZenGNT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/HayashiNLT10,
  author       = {Hayashi, Toyohiro and
                  Nankaku, Yoshihiko and
                  Lee, Akinobu and
                  Tokuda, Keiichi},
  editor       = {Kobayashi, Takao and
                  Hirose, Keikichi and
                  Nakamura, Satoshi},
  title        = {Speaker adaptation based on nonlinear spectral transform
                  for speech recognition},
  booktitle    = {11th Annual Conference of the International Speech Communication
                  Association, {INTERSPEECH} 2010, Makuhari, Chiba, Japan,
                  September 26-30, 2010},
  pages        = {542--545},
  publisher    = {{ISCA}},
  year         = {2010},
  url          = {https://doi.org/10.21437/Interspeech.2010-218},
  doi          = {10.21437/INTERSPEECH.2010-218},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HayashiNLT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/MaseONT10,
  author       = {Ayami Mase and
                  Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  editor       = {Takao Kobayashi and
                  Keikichi Hirose and
                  Satoshi Nakamura},
  title        = {{HMM}-based singing voice synthesis system using pitch-shifted pseudo
                  training data},
  booktitle    = {11th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2010, Makuhari, Chiba, Japan, September 26-30, 2010},
  pages        = {845--848},
  publisher    = {{ISCA}},
  year         = {2010},
  url          = {https://doi.org/10.21437/Interspeech.2010-188},
  doi          = {10.21437/INTERSPEECH.2010-188},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/MaseONT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/SaitoNLT10,
  author       = {Saito, Akira and
                  Nankaku, Yoshihiko and
                  Lee, Akinobu and
                  Tokuda, Keiichi},
  editor       = {Kobayashi, Takao and
                  Hirose, Keikichi and
                  Nakamura, Satoshi},
  title        = {Voice activity detection based on conditional random fields
                  using multiple features},
  booktitle    = {11th Annual Conference of the International Speech Communication
                  Association, {INTERSPEECH} 2010, Makuhari, Chiba, Japan,
                  September 26-30, 2010},
  pages        = {2086--2089},
  publisher    = {{ISCA}},
  year         = {2010},
  url          = {https://doi.org/10.21437/Interspeech.2010-588},
  doi          = {10.21437/INTERSPEECH.2010-588},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SaitoNLT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ssw/TakakiNT10,
  author       = {Shinji Takaki and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  editor       = {Yoshinori Sagisaka and
                  Keiichi Tokuda},
  title        = {Spectral modeling with contextual additive structure for {HMM}-based
                  speech synthesis},
  booktitle    = {The Seventh {ISCA} Tutorial and Research Workshop on Speech Synthesis,
                  {SSW} 2010, Kyoto, Japan, September 22-24, 2010},
  pages        = {100--105},
  publisher    = {{ISCA}},
  year         = {2010},
  url          = {https://www.isca-archive.org/ssw\_2010/takaki10\_ssw.html},
  timestamp    = {Fri, 02 Aug 2024 09:01:35 +0200},
  biburl       = {https://dblp.org/rec/conf/ssw/TakakiNT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ssw/HashimotoNT10,
  author       = {Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  editor       = {Yoshinori Sagisaka and
                  Keiichi Tokuda},
  title        = {{Bayesian} speech synthesis framework integrating training and synthesis
                  processes},
  booktitle    = {The Seventh {ISCA} Tutorial and Research Workshop on Speech Synthesis,
                  {SSW} 2010, Kyoto, Japan, September 22-24, 2010},
  pages        = {106--111},
  publisher    = {{ISCA}},
  year         = {2010},
  url          = {https://www.isca-archive.org/ssw\_2010/hashimoto10\_ssw.html},
  timestamp    = {Wed, 31 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ssw/HashimotoNT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ssw/OuraMYMNT10,
  author       = {Keiichiro Oura and
                  Ayami Mase and
                  Tomohiko Yamada and
                  Satoru Muto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  editor       = {Yoshinori Sagisaka and
                  Keiichi Tokuda},
  title        = {Recent development of the {HMM}-based singing voice synthesis system
                  - {Sinsy}},
  booktitle    = {The Seventh {ISCA} Tutorial and Research Workshop on Speech Synthesis,
                  {SSW} 2010, Kyoto, Japan, September 22-24, 2010},
  pages        = {211--216},
  publisher    = {{ISCA}},
  year         = {2010},
  url          = {https://www.isca-archive.org/ssw\_2010/oura10\_ssw.html},
  timestamp    = {Wed, 31 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ssw/OuraMYMNT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/YutaniUNLT09,
  author       = {Yutani, Kaori and
                  Uto, Yosuke and
                  Nankaku, Yoshihiko and
                  Lee, Akinobu and
                  Tokuda, Keiichi},
  title        = {Voice conversion based on simultaneous modelling of
                  spectrum and {F0}},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics,
                  Speech, and Signal Processing, {ICASSP} 2009, 19-24 April 2009,
                  Taipei, Taiwan},
  pages        = {3897--3900},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4960479},
  doi          = {10.1109/ICASSP.2009.4960479},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/YutaniUNLT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/HashimotoZNMT09,
  author       = {Kei Hashimoto and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Takashi Masuko and
                  Keiichi Tokuda},
  title        = {A {Bayesian} approach to {HMM}-based speech synthesis},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages        = {4029--4032},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4960512},
  doi          = {10.1109/ICASSP.2009.4960512},
  timestamp    = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/HashimotoZNMT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/ZenNT09,
  author       = {Heiga Zen and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Stereo-based stochastic noise compensation based on trajectory {GMMs}},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages        = {4577--4580},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4960649},
  doi          = {10.1109/ICASSP.2009.4960649},
  timestamp    = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ZenNT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/WuNT09,
  author       = {Yi{-}Jian Wu and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {State mapping based method for cross-lingual speaker adaptation in
                  {HMM}-based speech synthesis},
  booktitle    = {10th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2009, Brighton, United Kingdom, September 6-10, 2009},
  pages        = {528--531},
  publisher    = {{ISCA}},
  year         = {2009},
  url          = {https://doi.org/10.21437/Interspeech.2009-192},
  doi          = {10.21437/INTERSPEECH.2009-192},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/WuNT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/ShiotaHNT09,
  author       = {Sayaka Shiota and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Deterministic annealing based training algorithm for {Bayesian} speech
                  recognition},
  booktitle    = {10th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2009, Brighton, United Kingdom, September 6-10, 2009},
  pages        = {680--683},
  publisher    = {{ISCA}},
  year         = {2009},
  url          = {https://doi.org/10.21437/Interspeech.2009-236},
  doi          = {10.21437/INTERSPEECH.2009-236},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ShiotaHNT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/HashimotoNT09,
  author       = {Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {A {Bayesian} approach to Hidden Semi-{Markov} Model based speech synthesis},
  booktitle    = {10th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2009, Brighton, United Kingdom, September 6-10, 2009},
  pages        = {1751--1754},
  publisher    = {{ISCA}},
  year         = {2009},
  url          = {https://doi.org/10.21437/Interspeech.2009-141},
  doi          = {10.21437/INTERSPEECH.2009-141},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HashimotoNT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/OuraZNLT09,
  author       = {Keiichiro Oura and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Akinobu Lee and
                  Keiichi Tokuda},
  title        = {Tying covariance matrices to reduce the footprint of {HMM}-based speech
                  synthesis systems},
  booktitle    = {10th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2009, Brighton, United Kingdom, September 6-10, 2009},
  pages        = {1759--1762},
  publisher    = {{ISCA}},
  year         = {2009},
  url          = {https://doi.org/10.21437/Interspeech.2009-143},
  doi          = {10.21437/INTERSPEECH.2009-143},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/OuraZNLT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ieicet/OuraZNLT08,
  author       = {Keiichiro Oura and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Akinobu Lee and
                  Keiichi Tokuda},
  title        = {A Fully Consistent Hidden Semi-{Markov} Model-Based Speech Recognition
                  System},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {91-D},
  number       = {11},
  pages        = {2693--2700},
  year         = {2008},
  url          = {https://doi.org/10.1093/ietisy/e91-d.11.2693},
  doi          = {10.1093/IETISY/E91-D.11.2693},
  timestamp    = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/OuraZNLT08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/NankakuNZT08,
  author       = {Yoshihiko Nankaku and
                  Kazuhiro Nakamura and
                  Heiga Zen and
                  Keiichi Tokuda},
  title        = {Acoustic modeling with contextual additive structure for {HMM}-based
                  speech recognition},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2008, March 30 - April 4, 2008, Caesars
                  Palace, Las Vegas, Nevada, {USA}},
  pages        = {4469--4472},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ICASSP.2008.4518648},
  doi          = {10.1109/ICASSP.2008.4518648},
  timestamp    = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/NankakuNZT08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/YoshimiKNLT08,
  author       = {Yoshimi, Yoshitaka and
                  Kakitsuba, Ryota and
                  Nankaku, Yoshihiko and
                  Lee, Akinobu and
                  Tokuda, Keiichi},
  title        = {Probabilistic answer selection based on conditional random
                  fields for spoken dialog system},
  booktitle    = {9th Annual Conference of the International Speech Communication
                  Association, {INTERSPEECH} 2008, Brisbane, Australia,
                  September 22-26, 2008},
  pages        = {215--218},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-67},
  doi          = {10.21437/INTERSPEECH.2008-67},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/YoshimiKNLT08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/ShiotaHZNLT08,
  author       = {Shiota, Sayaka and
                  Hashimoto, Kei and
                  Zen, Heiga and
                  Nankaku, Yoshihiko and
                  Lee, Akinobu and
                  Tokuda, Keiichi},
  title        = {Acoustic modeling based on model structure annealing for
                  speech recognition},
  booktitle    = {9th Annual Conference of the International Speech Communication
                  Association, {INTERSPEECH} 2008, Brisbane, Australia,
                  September 22-26, 2008},
  pages        = {932--935},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-111},
  doi          = {10.21437/INTERSPEECH.2008-111},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ShiotaHZNLT08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/HashimotoZNLT08,
  author       = {Kei Hashimoto and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Akinobu Lee and
                  Keiichi Tokuda},
  title        = {{Bayesian} context clustering using cross valid prior distribution for
                  {HMM}-based speech recognition},
  booktitle    = {9th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages        = {936--939},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-112},
  doi          = {10.21437/INTERSPEECH.2008-112},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HashimotoZNLT08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/ZenNT08,
  author       = {Heiga Zen and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Probabilistic feature mapping based on trajectory {HMMs}},
  booktitle    = {9th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages        = {1068--1071},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-330},
  doi          = {10.21437/INTERSPEECH.2008-330},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ZenNT08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/YutaniUNTT08,
  author    = {Yutani, Kaori and
               Uto, Yosuke and
               Nankaku, Yoshihiko and
               Toda, Tomoki and
               Tokuda, Keiichi},
  title     = {Simultaneous conversion of duration and spectrum based on statistical
               models including time-sequence matching},
  booktitle = {9th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages     = {1072--1075},
  publisher = {{ISCA}},
  year      = {2008},
  url       = {https://doi.org/10.21437/Interspeech.2008-331},
  doi       = {10.21437/INTERSPEECH.2008-331},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/YutaniUNTT08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/interspeech/ItoHNLT08,
  author       = {Tatsuya Ito and
                  Kei Hashimoto and
                  Yoshihiko Nankaku and
                  Akinobu Lee and
                  Keiichi Tokuda},
  title        = {Speaker recognition based on variational {Bayesian} method},
  booktitle    = {9th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages        = {1417--1420},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-410},
  doi          = {10.21437/INTERSPEECH.2008-410},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ItoHNLT08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/iscslp/OuraNTTMSN08,
  author       = {Keiichiro Oura and
                  Yoshihiko Nankaku and
                  Tomoki Toda and
                  Keiichi Tokuda and
                  Ranniery Maia and
                  Shinsuke Sakai and
                  Satoshi Nakamura},
  editor       = {Helen M. Meng and
                  Hui Jiang and
                  Jianhua Tao and
                  Ren{-}Hua Wang},
  title        = {Simultaneous Acoustic, Prosodic, and Phrasing Model Training for {TTS}
                  Conversion Systems},
  booktitle    = {6th International Symposium on Chinese Spoken Language Processing,
                  {ISCSLP} 2008, 16-19 December, 2008, Kunming, China},
  pages        = {1--4},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/CHINSL.2008.ECP.12},
  doi          = {10.1109/CHINSL.2008.ECP.12},
  timestamp    = {Wed, 18 Sep 2024 12:50:19 +0200},
  biburl       = {https://dblp.org/rec/conf/iscslp/OuraNTTMSN08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/NankakuT07,
  author       = {Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Face Recognition using Hidden {Markov} Eigenface Models},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2007, Honolulu, Hawaii, USA, April
                  15-20, 2007},
  pages        = {469--472},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ICASSP.2007.366274},
  doi          = {10.1109/ICASSP.2007.366274},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/NankakuT07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/MaiaTZNT07,
  author       = {Ranniery Maia and
                  Tomoki Toda and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {A trainable excitation model for {HMM}-based speech synthesis},
  booktitle    = {8th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2007, Antwerp, Belgium, August 27-31, 2007},
  pages        = {1909--1912},
  publisher    = {{ISCA}},
  year         = {2007},
  url          = {https://doi.org/10.21437/Interspeech.2007-530},
  doi          = {10.21437/INTERSPEECH.2007-530},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/MaiaTZNT07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/ZenNT07,
  author       = {Heiga Zen and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  title        = {Model-space {MLLR} for trajectory {HMMs}},
  booktitle    = {8th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2007, Antwerp, Belgium, August 27-31, 2007},
  pages        = {2065--2068},
  publisher    = {{ISCA}},
  year         = {2007},
  url          = {https://doi.org/10.21437/Interspeech.2007-559},
  doi          = {10.21437/INTERSPEECH.2007-559},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ZenNT07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ssw/MaiaTZNT07,
  author       = {Ranniery Maia and
                  Tomoki Toda and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda},
  editor       = {Petra Wagner and
                  Julia Abresch and
                  Stefan Breuer and
                  Wolfgang Hess},
  title        = {An excitation model for {HMM}-based speech synthesis based on residual
                  modeling},
  booktitle    = {Sixth {ISCA} Workshop on Speech Synthesis, {SSW} 2007, Bonn, Germany,
                  August 22-24, 2007},
  pages        = {131--136},
  publisher    = {{ISCA}},
  year         = {2007},
  url          = {https://www.isca-archive.org/ssw\_2007/maia07\_ssw.html},
  timestamp    = {Fri, 02 Aug 2024 09:01:26 +0200},
  biburl       = {https://dblp.org/rec/conf/ssw/MaiaTZNT07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ssw/NankakuNTT07,
  author    = {Nankaku, Yoshihiko and
               Nakamura, Kenichi and
               Toda, Tomoki and
               Tokuda, Keiichi},
  editor    = {Wagner, Petra and
               Abresch, Julia and
               Breuer, Stefan and
               Hess, Wolfgang},
  title     = {Spectral conversion based on statistical models including time-sequence
               matching},
  booktitle = {Sixth {ISCA} Workshop on Speech Synthesis, {SSW} 2007, Bonn, Germany,
               August 22-24, 2007},
  pages     = {333--338},
  publisher = {{ISCA}},
  year      = {2007},
  url       = {https://www.isca-archive.org/ssw\_2007/nankaku07\_ssw.html},
  timestamp = {Wed, 31 Jul 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ssw/NankakuNTT07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/icassp/OuraZNLT06,
  author       = {Keiichiro Oura and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Akinobu Lee and
                  Keiichi Tokuda},
  title        = {Hidden Semi-{Markov} Model Based Speech Recognition System using Weighted
                  Finite-State Transducer},
  booktitle    = {2006 {IEEE} International Conference on Acoustics Speech and Signal
                  Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages        = {33--36},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/ICASSP.2006.1659950},
  doi          = {10.1109/ICASSP.2006.1659950},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/OuraZNLT06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/NakamuraTNT06,
  author    = {Nakamura, Kenichi and
               Toda, Tomoki and
               Nankaku, Yoshihiko and
               Tokuda, Keiichi},
  title     = {On the Use of Phonetic Information for Mapping from Articulatory Movements
               to Vocal Tract Spectrum},
  booktitle = {2006 {IEEE} International Conference on Acoustics Speech and Signal
               Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages     = {93--96},
  publisher = {{IEEE}},
  year      = {2006},
  url       = {https://doi.org/10.1109/ICASSP.2006.1659965},
  doi       = {10.1109/ICASSP.2006.1659965},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/NakamuraTNT06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/icassp/KurataNTKG06,
  author       = {Daisuke Kurata and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda and
                  Tadashi Kitamura and
                  Zoubin Ghahramani},
  title        = {Face Recognition Based on Separable Lattice {HMMs}},
  booktitle    = {2006 {IEEE} International Conference on Acoustics Speech and Signal
                  Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages        = {737--740},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/ICASSP.2006.1661381},
  doi          = {10.1109/ICASSP.2006.1661381},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/KurataNTKG06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/ZenNTK06,
  author       = {Heiga Zen and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda and
                  Tadashi Kitamura},
  title        = {Estimating Trajectory {HMM} Parameters Using {Monte Carlo} {EM} With {Gibbs}
                  Sampler},
  booktitle    = {2006 {IEEE} International Conference on Acoustics Speech and Signal
                  Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages        = {1173--1176},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/ICASSP.2006.1660235},
  doi          = {10.1109/ICASSP.2006.1660235},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ZenNTK06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/HakamataLNT06,
  author    = {Hakamata, Tomohiro and
               Lee, Akinobu and
               Nankaku, Yoshihiko and
               Tokuda, Keiichi},
  title     = {Reducing computation on parallel decoding using frame-wise confidence
               scores},
  booktitle = {Ninth International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP}
               2006, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher = {{ISCA}},
  year      = {2006},
  url       = {https://doi.org/10.21437/Interspeech.2006-457},
  doi       = {10.21437/INTERSPEECH.2006-457},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/HakamataLNT06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/interspeech/SainoZNLT06,
  author       = {Keijiro Saino and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Akinobu Lee and
                  Keiichi Tokuda},
  title        = {An {HMM}-based singing voice synthesis system},
  booktitle    = {Ninth International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP}
                  2006, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher    = {{ISCA}},
  year         = {2006},
  url          = {https://doi.org/10.21437/Interspeech.2006-584},
  doi          = {10.21437/INTERSPEECH.2006-584},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SainoZNLT06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/UtoNTLT06,
  author    = {Uto, Yosuke and
               Nankaku, Yoshihiko and
               Toda, Tomoki and
               Lee, Akinobu and
               Tokuda, Keiichi},
  title     = {Voice conversion based on mixtures of factor analyzers},
  booktitle = {Ninth International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP}
               2006, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher = {{ISCA}},
  year      = {2006},
  url       = {https://doi.org/10.21437/Interspeech.2006-585},
  doi       = {10.21437/INTERSPEECH.2006-585},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/UtoNTLT06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/interspeech/ZenNTK06,
  author       = {Heiga Zen and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda and
                  Tadashi Kitamura},
  title        = {Speaker adaptation of trajectory {HMMs} using feature-space {MLLR}},
  booktitle    = {Ninth International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP}
                  2006, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher    = {{ISCA}},
  year         = {2006},
  url          = {https://doi.org/10.21437/Interspeech.2006-348},
  doi          = {10.21437/INTERSPEECH.2006-348},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ZenNTK06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ieicet/LimaZNTKR05,
  author       = {Amaro A. de Lima and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Keiichi Tokuda and
                  Tadashi Kitamura and
                  Fernando Gil Resende},
  title        = {Applying Sparse {KPCA} for Feature Extraction in Speech Recognition},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {88-D},
  number       = {3},
  pages        = {401--409},
  year         = {2005},
  url          = {http://search.ieice.org/bin/summary.php?id=e88-d\_3\_401\&category=D\&year=2005\&lang=E\&abst=},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ieicet/LimaZNTKR05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ieicet/SuzukiZNMTK05,
  author       = {Hiroyuki Suzuki and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Chiyomi Miyajima and
                  Keiichi Tokuda and
                  Tadashi Kitamura},
  title        = {Continuous Speech Recognition Based on General Factor Dependent Acoustic
                  Models},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {88-D},
  number       = {3},
  pages        = {410--417},
  year         = {2005},
  url          = {http://search.ieice.org/bin/summary.php?id=e88-d\_3\_410\&category=D\&year=2005\&lang=E\&abst=},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/SuzukiZNMTK05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ieicet/YamamotoNMTK05,
  author       = {Hiroyoshi Yamamoto and
                  Yoshihiko Nankaku and
                  Chiyomi Miyajima and
                  Keiichi Tokuda and
                  Tadashi Kitamura},
  title        = {Parameter Sharing in Mixture of Factor Analyzers for Speaker Identification},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {88-D},
  number       = {3},
  pages        = {418--424},
  year         = {2005},
  url          = {http://search.ieice.org/bin/summary.php?id=e88-d\_3\_418\&category=D\&year=2005\&lang=E\&abst=},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/YamamotoNMTK05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ieicet/ItayaZNMTK05,
  author       = {Yohei Itaya and
                  Heiga Zen and
                  Yoshihiko Nankaku and
                  Chiyomi Miyajima and
                  Keiichi Tokuda and
                  Tadashi Kitamura},
  title        = {Deterministic Annealing {EM} Algorithm in Acoustic Modeling for Speaker
                  and Speech Recognition},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {88-D},
  number       = {3},
  pages        = {425--431},
  year         = {2005},
  url          = {http://search.ieice.org/bin/summary.php?id=e88-d\_3\_425\&category=D\&year=2005\&lang=E\&abst=},
  timestamp    = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ieicet/ItayaZNMTK05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icassp/LimaZNTKR05,
  author    = {de Lima, Amaro A. and
               Zen, Heiga and
               Nankaku, Yoshihiko and
               Tokuda, Keiichi and
               Kitamura, Tadashi and
               Resende, Fernando Gil},
  title     = {Sparse {KPCA} for Feature Extraction in Speech Recognition},
  booktitle = {2005 {IEEE} International Conference on Acoustics, Speech, and Signal
               Processing, {ICASSP} '05, Philadelphia, Pennsylvania, USA, March 18-23,
               2005},
  pages     = {353--356},
  publisher = {{IEEE}},
  year      = {2005},
  url       = {https://doi.org/10.1109/ICASSP.2005.1415123},
  doi       = {10.1109/ICASSP.2005.1415123},
  timestamp = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/LimaZNTKR05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/ieicet/LimaZNMTK04,
  author    = {de Lima, Amaro A. and
               Zen, Heiga and
               Nankaku, Yoshihiko and
               Miyajima, Chiyomi and
               Tokuda, Keiichi and
               Kitamura, Tadashi},
  title     = {On the Use of Kernel {PCA} for Feature Extraction in Speech Recognition},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {87-D},
  number    = {12},
  pages     = {2802--2811},
  year      = {2004},
  url       = {http://search.ieice.org/bin/summary.php?id=e87-d\_12\_2802},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ieicet/LimaZNMTK04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/icassp/YamamotoNMTK04,
  author    = {Yamamoto, Hiroyoshi and
               Nankaku, Yoshihiko and
               Miyajima, Chiyomi and
               Tokuda, Keiichi and
               Kitamura, Tadashi},
  title     = {Parameter sharing and minimum classification error training of mixtures
               of factor analyzers for speaker identification},
  booktitle = {2004 {IEEE} International Conference on Acoustics, Speech, and Signal
               Processing, {ICASSP} 2004, Montreal, Quebec, Canada, May 17-21, 2004},
  pages     = {29--32},
  publisher = {{IEEE}},
  year      = {2004},
  url       = {https://doi.org/10.1109/ICASSP.2004.1325914},
  doi       = {10.1109/ICASSP.2004.1325914},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/YamamotoNMTK04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/interspeech/ItayaZNMTK04,
  author    = {Itaya, Yohei and
               Zen, Heiga and
               Nankaku, Yoshihiko and
               Miyajima, Chiyomi and
               Tokuda, Keiichi and
               Kitamura, Tadashi},
  title     = {Deterministic annealing {EM} algorithm in parameter estimation for
               acoustic model},
  booktitle = {8th International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP}
               2004, Jeju Island, Korea, October 4-8, 2004},
  pages     = {433--436},
  publisher = {{ISCA}},
  year      = {2004},
  url       = {https://doi.org/10.21437/Interspeech.2004-176},
  doi       = {10.21437/INTERSPEECH.2004-176},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ItayaZNMTK04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/icassp/SuzukiZNMTK03,
  author    = {Suzuki, Hiroyuki and
               Zen, Heiga and
               Nankaku, Yoshihiko and
               Miyajima, Chiyomi and
               Tokuda, Keiichi and
               Kitamura, Tadashi},
  title     = {Speech recognition using voice-characteristic-dependent acoustic models},
  booktitle = {2003 {IEEE} International Conference on Acoustics, Speech, and Signal
               Processing, {ICASSP} '03, Hong Kong, April 6-10, 2003},
  pages     = {740--743},
  publisher = {{IEEE}},
  year      = {2003},
  url       = {https://doi.org/10.1109/ICASSP.2003.1198887},
  doi       = {10.1109/ICASSP.2003.1198887},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/SuzukiZNMTK03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/interspeech/LimaZNMTK03,
  author    = {de Lima, Amaro A. and
               Zen, Heiga and
               Nankaku, Yoshihiko and
               Miyajima, Chiyomi and
               Tokuda, Keiichi and
               Kitamura, Tadashi},
  title     = {On the use of kernel {PCA} for feature extraction in speech recognition},
  booktitle = {8th European Conference on Speech Communication and Technology, {EUROSPEECH}
               2003 - {INTERSPEECH} 2003, Geneva, Switzerland, September 1-4, 2003},
  pages     = {2625--2628},
  publisher = {{ISCA}},
  year      = {2003},
  url       = {https://doi.org/10.21437/Eurospeech.2003-704},
  doi       = {10.21437/EUROSPEECH.2003-704},
  timestamp = {Thu, 22 Jun 2023 16:42:17 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/LimaZNMTK03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/icip/NankakuTKK00,
  author       = {Yoshihiko Nankaku and
                  Keiichi Tokuda and
                  Tadashi Kitamura and
                  Takao Kobayashi},
  title        = {Normalized Training for {HMM}-Based Visual Speech Recognition},
  booktitle    = {Proceedings of the 2000 International Conference on Image Processing,
                  {ICIP} 2000, Vancouver, BC, Canada, September 10-13, 2000},
  pages        = {234--237},
  publisher    = {{IEEE}},
  year         = {2000},
  url          = {https://doi.org/10.1109/ICIP.2000.899338},
  doi          = {10.1109/ICIP.2000.899338},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icip/NankakuTKK00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/interspeech/NankakuTK99,
  author       = {Yoshihiko Nankaku and
                  Keiichi Tokuda and
                  Tadashi Kitamura},
  title        = {Intensity- and location-normalized training for {HMM}-based visual speech
                  recognition},
  booktitle    = {Sixth European Conference on Speech Communication and Technology,
                  {EUROSPEECH} 1999, Budapest, Hungary, September 5-9, 1999},
  pages        = {1287--1290},
  publisher    = {{ISCA}},
  year         = {1999},
  url          = {https://doi.org/10.21437/Eurospeech.1999-329},
  doi          = {10.21437/EUROSPEECH.1999-329},
  timestamp    = {Wed, 18 Sep 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/NankakuTK99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

manage site settings

To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt-in for them to become active. All settings here will be stored as cookies with your web browser. For more information see our F.A.Q.