% BibTeX records for Yoshihiko Nankaku, exported from the dblp computer science
% bibliography (https://dblp.org).
% IEEE Access article (2025). "V2Coder" is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/access/FujimotoHNT25,
  author     = {Takato Fujimoto and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {{V2Coder}: {A} Non-Autoregressive Vocoder Based on Hierarchical
                Variational Autoencoders},
  journal    = {{IEEE} Access},
  volume     = {13},
  pages      = {92833--92847},
  year       = {2025},
  url        = {https://doi.org/10.1109/ACCESS.2025.3572904},
  doi        = {10.1109/ACCESS.2025.3572904},
  timestamp  = {Sun, 06 Jul 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/access/FujimotoHNT25.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2024 paper; arXiv version: DBLP:journals/corr/abs-2402-14692.
% "PeriodGrad" is braced so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/icassp/HonoHNT24,
  author     = {Yukiya Hono and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {{PeriodGrad}: Towards Pitch-Controllable Neural Vocoder Based on
                a Diffusion Probabilistic Model},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2024, Seoul, Republic of Korea, April 14-19,
                2024},
  pages      = {12782--12786},
  publisher  = {{IEEE}},
  year       = {2024},
  url        = {https://doi.org/10.1109/ICASSP48485.2024.10448502},
  doi        = {10.1109/ICASSP48485.2024.10448502},
  timestamp  = {Sun, 19 Jan 2025 13:18:23 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/HonoHNT24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; conference version: DBLP:conf/icassp/HonoHNT24.
% "PeriodGrad" is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2402-14692,
  author     = {Yukiya Hono and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {{PeriodGrad}: Towards Pitch-Controllable Neural Vocoder Based on
                a Diffusion Probabilistic Model},
  journal    = {CoRR},
  volume     = {abs/2402.14692},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.14692},
  doi        = {10.48550/ARXIV.2402.14692},
  eprinttype = {arXiv},
  eprint     = {2402.14692},
  timestamp  = {Fri, 22 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-14692.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2023 paper; arXiv version: DBLP:journals/corr/abs-2212-13703.
% booktitle: comma restored after "Signal Processing" to match the other ICASSP entries.
@inproceedings{DBLP:conf/icassp/HonoHNT23,
  author     = {Yukiya Hono and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Singing Voice Synthesis Based on a Musical Note Position-Aware
                Attention Mechanism},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages      = {1--5},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/ICASSP49357.2023.10095919},
  doi        = {10.1109/ICASSP49357.2023.10095919},
  timestamp  = {Sun, 19 Jan 2025 13:18:24 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/HonoHNT23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2023 paper; arXiv version: DBLP:journals/corr/abs-2211-11222.
% booktitle: comma restored after "Signal Processing" to match the other ICASSP entries.
@inproceedings{DBLP:conf/icassp/YoshimuraTNOHHNT23,
  author     = {Takenori Yoshimura and
                Shinji Takaki and
                Kazuhiro Nakamura and
                Keiichiro Oura and
                Yukiya Hono and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Embedding a Differentiable Mel-Cepstral Synthesis Filter to a
                Neural Speech Synthesis System},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages      = {1--5},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/ICASSP49357.2023.10094872},
  doi        = {10.1109/ICASSP49357.2023.10094872},
  timestamp  = {Sun, 05 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/YoshimuraTNOHHNT23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (2023) on singing voice synthesis with vocal timing deviation.
@article{DBLP:journals/corr/abs-2301-02262,
  author     = {Miku Nishihara and
                Yukiya Hono and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Singing voice synthesis based on frame-level sequence-to-sequence models
                considering vocal timing deviation},
  journal    = {CoRR},
  volume     = {abs/2301.02262},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.02262},
  doi        = {10.48550/ARXIV.2301.02262},
  eprinttype = {arXiv},
  eprint     = {2301.02262},
  timestamp  = {Tue, 10 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-02262.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% GCCE 2022 conference paper.
@inproceedings{DBLP:conf/gcce/NakamuraHSTNK22,
  author     = {Yasutaka Nakamura and
                Seiichi Harata and
                Takuto Sakuma and
                Yoshihiro Tanaka and
                Yoshihiko Nankaku and
                Shohei Kato},
  title      = {Enhancing Social Telepresence on Text Communication Using Robot
                Avatar that Reflects User's Chatting States},
  booktitle  = {11th {IEEE} Global Conference on Consumer Electronics, {GCCE}
                2022, Osaka, Japan, October 18-21, 2022},
  pages      = {707--709},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/GCCE56475.2022.10014193},
  doi        = {10.1109/GCCE56475.2022.10014193},
  timestamp  = {Tue, 07 May 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/gcce/NakamuraHSTNK22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2022 paper. "Semi-Markov" is braced so the proper noun survives sentence-casing styles.
@inproceedings{DBLP:conf/icassp/FujimotoHNT22,
  author     = {Takato Fujimoto and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Autoregressive Variational Autoencoder with a Hidden {Semi-Markov}
                Model-Based Structured Attention for Speech Synthesis},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages      = {7462--7466},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/ICASSP43922.2022.9746158},
  doi        = {10.1109/ICASSP43922.2022.9746158},
  timestamp  = {Tue, 07 Jun 2022 17:34:47 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/FujimotoHNT22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2022 paper; arXiv version: DBLP:journals/corr/abs-2206-12040.
@inproceedings{DBLP:conf/interspeech/MitsuiZSHNT22,
  author     = {Kentaro Mitsui and
                Tianyu Zhao and
                Kei Sawada and
                Yukiya Hono and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  editor     = {Hanseok Ko and
                John H. L. Hansen},
  title      = {End-to-End Text-to-Speech Based on Latent Representation of
                Speaking Styles Using Spontaneous Dialogue},
  booktitle  = {23rd Annual Conference of the International Speech Communication
                Association, Interspeech 2022, Incheon, Korea, September 18-22,
                2022},
  pages      = {2328--2332},
  publisher  = {{ISCA}},
  year       = {2022},
  url        = {https://doi.org/10.21437/Interspeech.2022-259},
  doi        = {10.21437/INTERSPEECH.2022-259},
  timestamp  = {Tue, 17 Jun 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/MitsuiZSHNT22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; conference version: DBLP:conf/interspeech/MitsuiZSHNT22.
@article{DBLP:journals/corr/abs-2206-12040,
  author     = {Kentaro Mitsui and
                Tianyu Zhao and
                Kei Sawada and
                Yukiya Hono and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {End-to-End Text-to-Speech Based on Latent Representation of
                Speaking Styles Using Spontaneous Dialogue},
  journal    = {CoRR},
  volume     = {abs/2206.12040},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.12040},
  doi        = {10.48550/ARXIV.2206.12040},
  eprinttype = {arXiv},
  eprint     = {2206.12040},
  timestamp  = {Tue, 17 Jun 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-12040.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; conference version: DBLP:conf/icassp/YoshimuraTNOHHNT23.
@article{DBLP:journals/corr/abs-2211-11222,
  author     = {Takenori Yoshimura and
                Shinji Takaki and
                Kazuhiro Nakamura and
                Keiichiro Oura and
                Yukiya Hono and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Embedding a Differentiable Mel-cepstral Synthesis Filter to a
                Neural Speech Synthesis System},
  journal    = {CoRR},
  volume     = {abs/2211.11222},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.11222},
  doi        = {10.48550/ARXIV.2211.11222},
  eprinttype = {arXiv},
  eprint     = {2211.11222},
  timestamp  = {Thu, 24 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-11222.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; conference version: DBLP:conf/icassp/HonoHNT23.
@article{DBLP:journals/corr/abs-2212-13703,
  author     = {Yukiya Hono and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Singing Voice Synthesis Based on a Musical Note Position-Aware
                Attention Mechanism},
  journal    = {CoRR},
  volume     = {abs/2212.13703},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.13703},
  doi        = {10.48550/ARXIV.2212.13703},
  eprinttype = {arXiv},
  eprint     = {2212.13703},
  timestamp  = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-13703.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IEEE Access article (2021); presumably the journal extension of DBLP:conf/icassp/HonoTHONT21 (verify).
% "PeriodNet" is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/access/HonoTHONT21,
  author     = {Yukiya Hono and
                Shinji Takaki and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {{PeriodNet}: {A} Non-Autoregressive Raw Waveform Generative Model
                With a Structure Separating Periodic and Aperiodic Components},
  journal    = {{IEEE} Access},
  volume     = {9},
  pages      = {137599--137612},
  year       = {2021},
  url        = {https://doi.org/10.1109/ACCESS.2021.3118033},
  doi        = {10.1109/ACCESS.2021.3118033},
  timestamp  = {Wed, 03 Nov 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/access/HonoTHONT21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (2021); arXiv version: DBLP:journals/corr/abs-2108-02776.
% journal: stored as the full journal name rather than the abbreviation.
@article{DBLP:journals/taslp/HonoHONT21,
  author     = {Yukiya Hono and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Sinsy: {A} Deep Neural Network-Based Singing Voice Synthesis System},
  journal    = {{IEEE/ACM} Transactions on Audio, Speech, and Language Processing},
  volume     = {29},
  pages      = {2803--2815},
  year       = {2021},
  url        = {https://doi.org/10.1109/TASLP.2021.3104165},
  doi        = {10.1109/TASLP.2021.3104165},
  timestamp  = {Sun, 19 Jan 2025 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/taslp/HonoHONT21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2021 paper; arXiv version: DBLP:journals/corr/abs-2102-07786.
% title: "Periodnet" restored to "PeriodNet" and braced against sentence-casing.
@inproceedings{DBLP:conf/icassp/HonoTHONT21,
  author     = {Yukiya Hono and
                Shinji Takaki and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {{PeriodNet}: {A} Non-Autoregressive Waveform Generation Model with
                a Structure Separating Periodic and Aperiodic Components},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages      = {6049--6053},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICASSP39728.2021.9414401},
  doi        = {10.1109/ICASSP39728.2021.9414401},
  timestamp  = {Fri, 09 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/HonoTHONT21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; conference version: DBLP:conf/icassp/HonoTHONT21.
% "PeriodNet" is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2102-07786,
  author     = {Yukiya Hono and
                Shinji Takaki and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {{PeriodNet}: {A} non-autoregressive waveform generation model with
                a structure separating periodic and aperiodic components},
  journal    = {CoRR},
  volume     = {abs/2102.07786},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.07786},
  eprinttype = {arXiv},
  eprint     = {2102.07786},
  timestamp  = {Fri, 19 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-07786.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; journal version: DBLP:journals/taslp/HonoHONT21.
@article{DBLP:journals/corr/abs-2108-02776,
  author     = {Yukiya Hono and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Sinsy: {A} Deep Neural Network-Based Singing Voice Synthesis
                System},
  journal    = {CoRR},
  volume     = {abs/2108.02776},
  year       = {2021},
  url        = {https://arxiv.org/abs/2108.02776},
  eprinttype = {arXiv},
  eprint     = {2108.02776},
  timestamp  = {Wed, 11 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-02776.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2020 paper; arXiv version: DBLP:journals/corr/abs-1910-11690.
@inproceedings{DBLP:conf/icassp/NakamuraTHONT20,
  author     = {Kazuhiro Nakamura and
                Shinji Takaki and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Fast and High-Quality Singing Voice Synthesis System Based on
                Convolutional Neural Networks},
  booktitle  = {2020 {IEEE} International Conference on Acoustics, Speech and
                Signal Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages      = {7239--7243},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.1109/ICASSP40776.2020.9053811},
  doi        = {10.1109/ICASSP40776.2020.9053811},
  timestamp  = {Thu, 23 Jul 2020 16:19:28 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/NakamuraTHONT20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2020 conference paper.
@inproceedings{DBLP:conf/icassp/FujimotoTHONT20,
  author     = {Takato Fujimoto and
                Shinji Takaki and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Semi-Supervised Learning Based on Hierarchical Generative Models
                for End-to-End Speech Synthesis},
  booktitle  = {2020 {IEEE} International Conference on Acoustics, Speech and
                Signal Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages      = {7644--7648},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.1109/ICASSP40776.2020.9054466},
  doi        = {10.1109/ICASSP40776.2020.9054466},
  timestamp  = {Thu, 23 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/FujimotoTHONT20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2020 paper; arXiv version: DBLP:journals/corr/abs-2009-08474.
@inproceedings{DBLP:conf/interspeech/HonoTSHONT20,
  author     = {Yukiya Hono and
                Kazuna Tsuboi and
                Kei Sawada and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  editor     = {Helen Meng and
                Bo Xu and
                Thomas Fang Zheng},
  title      = {Hierarchical Multi-Grained Generative Model for Expressive
                Speech Synthesis},
  booktitle  = {21st Annual Conference of the International Speech Communication
                Association, Interspeech 2020, Virtual Event, Shanghai, China,
                October 25-29, 2020},
  pages      = {3441--3445},
  publisher  = {{ISCA}},
  year       = {2020},
  url        = {https://doi.org/10.21437/Interspeech.2020-2477},
  doi        = {10.21437/INTERSPEECH.2020-2477},
  timestamp  = {Sun, 19 Jan 2025 13:13:53 +0100},
  biburl     = {https://dblp.org/rec/conf/interspeech/HonoTSHONT20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; conference version: DBLP:conf/interspeech/HonoTSHONT20.
@article{DBLP:journals/corr/abs-2009-08474,
  author     = {Yukiya Hono and
                Kazuna Tsuboi and
                Kei Sawada and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Hierarchical Multi-Grained Generative Model for Expressive
                Speech Synthesis},
  journal    = {CoRR},
  volume     = {abs/2009.08474},
  year       = {2020},
  url        = {https://arxiv.org/abs/2009.08474},
  eprinttype = {arXiv},
  eprint     = {2009.08474},
  timestamp  = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-08474.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2019 conference paper.
@inproceedings{DBLP:conf/icassp/HonoHONT19,
  author     = {Yukiya Hono and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Singing Voice Synthesis Based on Generative Adversarial
                Networks},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2019, Brighton, United Kingdom, May 12-17,
                2019},
  pages      = {6955--6959},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/ICASSP.2019.8683154},
  doi        = {10.1109/ICASSP.2019.8683154},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/HonoHONT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2019 paper. title: "Wavenet" and "Adpcm" restored to "WaveNet" and "ADPCM"
% and braced so sentence-casing styles cannot lowercase them again.
@inproceedings{DBLP:conf/icassp/YoshimuraHONT19,
  author     = {Takenori Yoshimura and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Speaker-dependent {WaveNet}-based Delay-free {ADPCM} Speech Coding},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2019, Brighton, United Kingdom, May 12-17,
                2019},
  pages      = {7145--7149},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/ICASSP.2019.8682264},
  doi        = {10.1109/ICASSP.2019.8682264},
  timestamp  = {Sun, 30 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/YoshimuraHONT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SSW 2019 workshop paper.
@inproceedings{DBLP:conf/ssw/OuraNHNT19,
  author     = {Keiichiro Oura and
                Kazuhiro Nakamura and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  editor     = {Michael Pucher},
  title      = {Deep neural network based real-time speech vocoder with periodic
                and aperiodic inputs},
  booktitle  = {10th {ISCA} Speech Synthesis Workshop, {SSW} 2019, Vienna,
                Austria, September 20-22, 2019},
  pages      = {13--18},
  publisher  = {{ISCA}},
  year       = {2019},
  url        = {https://doi.org/10.21437/SSW.2019-3},
  doi        = {10.21437/SSW.2019-3},
  timestamp  = {Wed, 31 Jul 2024 13:04:37 +0200},
  biburl     = {https://dblp.org/rec/conf/ssw/OuraNHNT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SSW 2019 workshop paper. "Japanese" is braced so the proper noun survives sentence-casing styles.
@inproceedings{DBLP:conf/ssw/FujimotoHONT19,
  author     = {Takato Fujimoto and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  editor     = {Michael Pucher},
  title      = {Impacts of input linguistic feature representation on {Japanese}
                end-to-end speech synthesis},
  booktitle  = {10th {ISCA} Speech Synthesis Workshop, {SSW} 2019, Vienna,
                Austria, September 20-22, 2019},
  pages      = {166--171},
  publisher  = {{ISCA}},
  year       = {2019},
  url        = {https://doi.org/10.21437/SSW.2019-30},
  doi        = {10.21437/SSW.2019-30},
  timestamp  = {Wed, 31 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ssw/FujimotoHONT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SSW 2019 workshop paper. "semi-Markov" is braced so the proper noun survives sentence-casing styles.
@inproceedings{DBLP:conf/ssw/ShimadaHONT19,
  author     = {Motoki Shimada and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  editor     = {Michael Pucher},
  title      = {Low computational cost speech synthesis based on deep neural
                networks using hidden {semi-Markov} model structures},
  booktitle  = {10th {ISCA} Speech Synthesis Workshop, {SSW} 2019, Vienna,
                Austria, September 20-22, 2019},
  pages      = {177--182},
  publisher  = {{ISCA}},
  year       = {2019},
  url        = {https://doi.org/10.21437/SSW.2019-32},
  doi        = {10.21437/SSW.2019-32},
  timestamp  = {Wed, 31 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ssw/ShimadaHONT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (2019). url: switched to https, matching the other arXiv entries in this file.
@article{DBLP:journals/corr/abs-1904-06868,
  author     = {Kazuhiro Nakamura and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Singing voice synthesis based on convolutional neural networks},
  journal    = {CoRR},
  volume     = {abs/1904.06868},
  year       = {2019},
  url        = {https://arxiv.org/abs/1904.06868},
  eprinttype = {arXiv},
  eprint     = {1904.06868},
  timestamp  = {Sat, 27 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-06868.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; conference version: DBLP:conf/icassp/NakamuraTHONT20.
% url: switched to https, matching the other arXiv entries in this file.
@article{DBLP:journals/corr/abs-1910-11690,
  author     = {Kazuhiro Nakamura and
                Shinji Takaki and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Fast and High-Quality Singing Voice Synthesis System based on
                Convolutional Neural Networks},
  journal    = {CoRR},
  volume     = {abs/1910.11690},
  year       = {2019},
  url        = {https://arxiv.org/abs/1910.11690},
  eprinttype = {arXiv},
  eprint     = {1910.11690},
  timestamp  = {Thu, 31 Oct 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1910-11690.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (2018). journal: stored as the full journal name rather than the abbreviation.
@article{DBLP:journals/taslp/YoshimuraHONT18,
  author     = {Takenori Yoshimura and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Mel-Cepstrum-Based Quantization Noise Shaping Applied to
                Neural-Network-Based Speech Waveform Synthesis},
  journal    = {{IEEE/ACM} Transactions on Audio, Speech, and Language Processing},
  volume     = {26},
  number     = {7},
  pages      = {1173--1180},
  year       = {2018},
  url        = {https://doi.org/10.1109/TASLP.2018.2818408},
  doi        = {10.1109/TASLP.2018.2818408},
  timestamp  = {Sun, 19 Jan 2025 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/taslp/YoshimuraHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% APSIPA ASC 2018 paper. "Markov" is braced so the proper noun survives sentence-casing styles.
@inproceedings{DBLP:conf/apsipa/KasugaiTSHONT18,
  author     = {Takayuki Kasugai and
                Yoshinari Tsuzuki and
                Kei Sawada and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Image Recognition Based on Convolutional Neural Networks Using
                Features Generated from Separable Lattice Hidden {Markov} Models},
  booktitle  = {Asia-Pacific Signal and Information Processing Association Annual
                Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA,
                November 12-15, 2018},
  pages      = {324--328},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.23919/APSIPA.2018.8659518},
  doi        = {10.23919/APSIPA.2018.8659518},
  timestamp  = {Wed, 16 Oct 2019 14:14:55 +0200},
  biburl     = {https://dblp.org/rec/conf/apsipa/KasugaiTSHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% APSIPA ASC 2018 paper. "Semi-Markov" is braced so the proper noun survives sentence-casing styles.
@inproceedings{DBLP:conf/apsipa/NakaoHONT18,
  author     = {Kento Nakao and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Speaker Adaptation for Speech Synthesis Based on Deep Neural
                Networks Using Hidden {Semi-Markov} Model Structures},
  booktitle  = {Asia-Pacific Signal and Information Processing Association Annual
                Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA,
                November 12-15, 2018},
  pages      = {638--643},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.23919/APSIPA.2018.8659791},
  doi        = {10.23919/APSIPA.2018.8659791},
  timestamp  = {Sat, 09 Mar 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/apsipa/NakaoHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% APSIPA ASC 2018 paper. "WaveNet" is braced so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/apsipa/FujimotoYHONT18,
  author     = {Takato Fujimoto and
                Takenori Yoshimura and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Speech Synthesis Using {WaveNet} Vocoder Based on
                Periodic/Aperiodic Decomposition},
  booktitle  = {Asia-Pacific Signal and Information Processing Association Annual
                Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA,
                November 12-15, 2018},
  pages      = {644--648},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.23919/APSIPA.2018.8659541},
  doi        = {10.23919/APSIPA.2018.8659541},
  timestamp  = {Sat, 09 Mar 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/apsipa/FujimotoYHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% APSIPA ASC 2018 paper. title: "DNN" and "Sinsy" braced against sentence-casing;
% the spaced hyphen before "Sinsy" is written as an en dash.
@inproceedings{DBLP:conf/apsipa/HonoMNHONT18,
  author     = {Yukiya Hono and
                Shumma Murata and
                Kazuhiro Nakamura and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Recent Development of the {DNN}-based Singing Voice Synthesis
                System -- {Sinsy}},
  booktitle  = {Asia-Pacific Signal and Information Processing Association Annual
                Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA,
                November 12-15, 2018},
  pages      = {1003--1009},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.23919/APSIPA.2018.8659797},
  doi        = {10.23919/APSIPA.2018.8659797},
  timestamp  = {Sat, 09 Mar 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/apsipa/HonoMNHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% APSIPA ASC 2018 conference paper.
@inproceedings{DBLP:conf/apsipa/YoshimuraKHONT18,
  author     = {Takenori Yoshimura and
                Natsumi Koike and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Discriminative Feature Extraction Based on Sequential
                Variational Autoencoder for Speaker Recognition},
  booktitle  = {Asia-Pacific Signal and Information Processing Association Annual
                Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA,
                November 12-15, 2018},
  pages      = {1742--1746},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.23919/APSIPA.2018.8659722},
  doi        = {10.23919/APSIPA.2018.8659722},
  timestamp  = {Sat, 09 Mar 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/apsipa/YoshimuraKHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% APSIPA ASC 2018 conference paper.
@inproceedings{DBLP:conf/apsipa/SendaHSHONT18,
  author     = {Koki Senda and
                Yukiya Hono and
                Kei Sawada and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Singing Voice Conversion Using Posted Waveform Data on Music
                Social Media},
  booktitle  = {Asia-Pacific Signal and Information Processing Association Annual
                Summit and Conference, {APSIPA} {ASC} 2018, Honolulu, HI, USA,
                November 12-15, 2018},
  pages      = {1913--1917},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.23919/APSIPA.2018.8659568},
  doi        = {10.23919/APSIPA.2018.8659568},
  timestamp  = {Sat, 09 Mar 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/apsipa/SendaHSHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Blizzard Challenge 2018 system description (no page numbers in the record).
% "NITech" and "Blizzard Challenge" are braced so sentence-casing styles keep their capitalisation.
@inproceedings{DBLP:conf/blizzard/SawadaYHONT18,
  author     = {Kei Sawada and
                Takenori Yoshimura and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {The {NITech} text-to-speech system for the {Blizzard Challenge}
                2018},
  booktitle  = {The Blizzard Challenge 2018, Hyderabad, India, September 8, 2018},
  publisher  = {{ISCA}},
  year       = {2018},
  url        = {https://doi.org/10.21437/Blizzard.2018-7},
  doi        = {10.21437/BLIZZARD.2018-7},
  timestamp  = {Fri, 20 Sep 2024 10:08:07 +0200},
  biburl     = {https://dblp.org/rec/conf/blizzard/SawadaYHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2018 paper. title: "Hmms" restored to the acronym "HMMs" and braced against sentence-casing.
@inproceedings{DBLP:conf/icassp/IchikawaSHNT18,
  author     = {Eiji Ichikawa and
                Kei Sawada and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Image Recognition Based on Separable Lattice {HMMs} Using a Deep
                Neural Network for Output Probability Distributions},
  booktitle  = {2018 {IEEE} International Conference on Acoustics, Speech and
                Signal Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20,
                2018},
  pages      = {3021--3025},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.1109/ICASSP.2018.8461784},
  doi        = {10.1109/ICASSP.2018.8461784},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/IchikawaSHNT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2018 paper. title: "Wavenet" restored to "WaveNet" and braced against sentence-casing.
@inproceedings{DBLP:conf/icassp/NiwaYHONT18,
  author     = {Jumpei Niwa and
                Takenori Yoshimura and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Statistical Voice Conversion Based on {WaveNet}},
  booktitle  = {2018 {IEEE} International Conference on Acoustics, Speech and
                Signal Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20,
                2018},
  pages      = {5289--5293},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.1109/ICASSP.2018.8461948},
  doi        = {10.1109/ICASSP.2018.8461948},
  timestamp  = {Tue, 18 Sep 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/NiwaYHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SLT 2018 workshop paper. "WaveNet" is braced so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/slt/YoshimuraHONT18,
  author     = {Takenori Yoshimura and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {{WaveNet}-Based Zero-Delay Lossless Speech Coding},
  booktitle  = {2018 {IEEE} Spoken Language Technology Workshop, {SLT} 2018,
                Athens, Greece, December 18-21, 2018},
  pages      = {153--158},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.1109/SLT.2018.8639598},
  doi        = {10.1109/SLT.2018.8639598},
  timestamp  = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl     = {https://dblp.org/rec/conf/slt/YoshimuraHONT18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (2017). journal: stored as the full journal name rather than the abbreviation.
@article{DBLP:journals/taslp/YoshimuraHONT17,
  author     = {Takenori Yoshimura and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Simultaneous Optimization of Multiple Tree-Based Factor Analyzed
                {HMM} for Speech Synthesis},
  journal    = {{IEEE/ACM} Transactions on Audio, Speech, and Language Processing},
  volume     = {25},
  number     = {9},
  pages      = {1836--1845},
  year       = {2017},
  url        = {https://doi.org/10.1109/TASLP.2017.2721219},
  doi        = {10.1109/TASLP.2017.2721219},
  timestamp  = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/taslp/YoshimuraHONT17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2017 paper. title: plural acronym corrected from "HMMS" to "HMMs" (still braced).
@inproceedings{DBLP:conf/icassp/TsuzukiSHNT17,
  author     = {Yoshinari Tsuzuki and
                Kei Sawada and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Image recognition based on discriminative models using features
                generated from separable lattice {HMMs}},
  booktitle  = {2017 {IEEE} International Conference on Acoustics, Speech and
                Signal Processing, {ICASSP} 2017, New Orleans, LA, USA, March 5-9,
                2017},
  pages      = {2607--2611},
  publisher  = {{IEEE}},
  year       = {2017},
  url        = {https://doi.org/10.1109/ICASSP.2017.7952628},
  doi        = {10.1109/ICASSP.2017.7952628},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/TsuzukiSHNT17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2017 conference paper.
@inproceedings{DBLP:conf/interspeech/GullyYMHNT17,
  author     = {Amelia Jane Gully and
                Takenori Yoshimura and
                Damian T. Murphy and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  editor     = {Francisco Lacerda},
  title      = {Articulatory Text-to-Speech Synthesis Using the Digital
                Waveguide Mesh Driven by a Deep Neural Network},
  booktitle  = {18th Annual Conference of the International Speech Communication
                Association, Interspeech 2017, Stockholm, Sweden, August 20-24,
                2017},
  pages      = {234--238},
  publisher  = {{ISCA}},
  year       = {2017},
  url        = {https://doi.org/10.21437/Interspeech.2017-900},
  doi        = {10.21437/INTERSPEECH.2017-900},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/GullyYMHNT17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Book chapter (Springer, 2017). "uDialogue" is braced so sentence-casing styles do not
% turn it into "udialogue". The escaped underscore in url/doi is kept exactly as exported.
@incollection{DBLP:books/sp/17/TokudaLNOHYTUTRY17,
  author     = {Keiichi Tokuda and
                Akinobu Lee and
                Yoshihiko Nankaku and
                Keiichiro Oura and
                Kei Hashimoto and
                Daisuke Yamamoto and
                Ichi Takumi and
                Takahiro Uchiya and
                Shuhei Tsutsumi and
                Steve Renals and
                Junichi Yamagishi},
  editor     = {Toyoaki Nishida},
  title      = {User Generated Dialogue Systems: {uDialogue}},
  booktitle  = {Human-Harmonized Information Technology, Volume 2, Horizontal
                Expansion},
  pages      = {77--114},
  publisher  = {Springer},
  year       = {2017},
  url        = {https://doi.org/10.1007/978-4-431-56535-2\_3},
  doi        = {10.1007/978-4-431-56535-2\_3},
  timestamp  = {Wed, 12 Feb 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/books/sp/17/TokudaLNOHYTUTRY17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (2016). title: "Bayesian" and "Markov" braced so the proper nouns survive
% sentence-casing styles. journal: stored as the full journal name rather than the abbreviation.
@article{DBLP:journals/ieicet/SawadaTHNT16,
  author     = {Kei Sawada and
                Akira Tamamori and
                Kei Hashimoto and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {A {Bayesian} Approach to Image Recognition Based on Separable
                Lattice Hidden {Markov} Models},
  journal    = {{IEICE} Transactions on Information and Systems},
  volume     = {99-D},
  number     = {12},
  pages      = {3119--3131},
  year       = {2016},
  url        = {https://doi.org/10.1587/transinf.2016EDP7112},
  doi        = {10.1587/TRANSINF.2016EDP7112},
  timestamp  = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ieicet/SawadaTHNT16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2016 conference paper.
@inproceedings{DBLP:conf/icassp/HashimotoONT16,
  author     = {Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  title      = {Trajectory training considering global variance for speech
                synthesis based on neural networks},
  booktitle  = {2016 {IEEE} International Conference on Acoustics, Speech and
                Signal Processing, {ICASSP} 2016, Shanghai, China, March 20-25,
                2016},
  pages      = {5600--5604},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/ICASSP.2016.7472749},
  doi        = {10.1109/ICASSP.2016.7472749},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/HashimotoONT16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2016 conference paper.
@inproceedings{DBLP:conf/interspeech/HosakaHONT16,
  author     = {Naoki Hosaka and
                Kei Hashimoto and
                Keiichiro Oura and
                Yoshihiko Nankaku and
                Keiichi Tokuda},
  editor     = {Nelson Morgan},
  title      = {Voice Conversion Based on Trajectory Model Training of Neural
                Networks Considering Global Variance},
  booktitle  = {17th Annual Conference of the International Speech Communication
                Association, Interspeech 2016, San Francisco, CA, USA, September
                8-12, 2016},
  pages      = {307--311},
  publisher  = {{ISCA}},
  year       = {2016},
  url        = {https://doi.org/10.21437/Interspeech.2016-1035},
  doi        = {10.21437/INTERSPEECH.2016-1035},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/HosakaHONT16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2016 paper: singing voice synthesis with deep neural networks.
@inproceedings{DBLP:conf/interspeech/NishimuraHONT16,
  author    = {Masanari Nishimura and
               Kei Hashimoto and
               Keiichiro Oura and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  editor    = {Nelson Morgan},
  title     = {Singing Voice Synthesis Based on Deep Neural Networks},
  booktitle = {17th Annual Conference of the International Speech Communication Association,
               Interspeech 2016, San Francisco, CA, USA, September 8-12, 2016},
  pages     = {2478--2482},
  publisher = {{ISCA}},
  year      = {2016},
  url       = {https://doi.org/10.21437/Interspeech.2016-1027},
  doi       = {10.21437/INTERSPEECH.2016-1027},
  timestamp = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/interspeech/NishimuraHONT16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2016 paper: linguistic context feature set for HMM and DNN TTS.
@inproceedings{DBLP:conf/interspeech/DallHONT16,
  author    = {Rasmus Dall and
               Kei Hashimoto and
               Keiichiro Oura and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  editor    = {Nelson Morgan},
  title     = {Redefining the Linguistic Context Feature Set for {HMM} and {DNN}
               {TTS} Through Position and Parsing},
  booktitle = {17th Annual Conference of the International Speech Communication Association,
               Interspeech 2016, San Francisco, CA, USA, September 8-12, 2016},
  pages     = {2851--2855},
  publisher = {{ISCA}},
  year      = {2016},
  url       = {https://doi.org/10.21437/Interspeech.2016-399},
  doi       = {10.21437/INTERSPEECH.2016-399},
  timestamp = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/interspeech/DallHONT16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SSW 2016 paper: temporal modeling in neural-network statistical parametric speech synthesis.
@inproceedings{DBLP:conf/ssw/TokudaHON16,
  author    = {Keiichi Tokuda and
               Kei Hashimoto and
               Keiichiro Oura and
               Yoshihiko Nankaku},
  editor    = {Alan W. Black},
  title     = {Temporal modeling in neural network based statistical parametric speech
               synthesis},
  booktitle = {The 9th {ISCA} Speech Synthesis Workshop, {SSW} 2016, Sunnyvale, CA,
               USA, September 13-15, 2016},
  pages     = {106--111},
  publisher = {{ISCA}},
  year      = {2016},
  url       = {https://doi.org/10.21437/SSW.2016-18},
  doi       = {10.21437/SSW.2016-18},
  timestamp = {Wed, 31 Jul 2024 11:28:11 +0200},
  biburl    = {https://dblp.org/rec/conf/ssw/TokudaHON16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2015 paper: effect of neural networks in statistical parametric speech synthesis.
@inproceedings{DBLP:conf/icassp/HashimotoONT15,
  author    = {Kei Hashimoto and
               Keiichiro Oura and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {The effect of neural networks in statistical parametric speech synthesis},
  booktitle = {2015 {IEEE} International Conference on Acoustics, Speech and Signal
               Processing, {ICASSP} 2015, South Brisbane, Queensland, Australia,
               April 19-24, 2015},
  pages     = {4455--4459},
  publisher = {{IEEE}},
  year      = {2015},
  url       = {https://doi.org/10.1109/ICASSP.2015.7178813},
  doi       = {10.1109/ICASSP.2015.7178813},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/HashimotoONT15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2015 paper: joint optimization of tree structures for factor-analyzed HMM synthesis.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/interspeech/YoshimuraHNT15,
  author    = {Takenori Yoshimura and
               Kei Hashimoto and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Simultaneous optimization of multiple tree structures for factor analyzed
               {HMM}-based speech synthesis},
  booktitle = {16th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages     = {1196--1200},
  publisher = {{ISCA}},
  year      = {2015},
  url       = {https://doi.org/10.21437/Interspeech.2015-303},
  doi       = {10.21437/INTERSPEECH.2015-303},
  timestamp = {Sun, 19 Jan 2025 13:13:53 +0100},
  biburl    = {https://dblp.org/rec/conf/interspeech/YoshimuraHNT15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2015 paper: prosodically-enhanced recurrent neural network language models.
@inproceedings{DBLP:conf/interspeech/GangireddyRNL15,
  author    = {Siva Reddy Gangireddy and
               Steve Renals and
               Yoshihiko Nankaku and
               Akinobu Lee},
  title     = {Prosodically-enhanced recurrent neural network language models},
  booktitle = {16th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages     = {2390--2394},
  publisher = {{ISCA}},
  year      = {2015},
  url       = {https://doi.org/10.21437/Interspeech.2015-517},
  doi       = {10.21437/INTERSPEECH.2015-517},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/GangireddyRNL15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEICE Trans. 2014 article: integrating spectral feature extraction and modeling.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@article{DBLP:journals/ieicet/NakamuraHNT14,
  author    = {Kazuhiro Nakamura and
               Kei Hashimoto and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Integration of Spectral Feature Extraction and Modeling for {HMM}-Based
               Speech Synthesis},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {97-D},
  number    = {6},
  pages     = {1438--1448},
  year      = {2014},
  url       = {https://doi.org/10.1587/transinf.E97.D.1438},
  doi       = {10.1587/TRANSINF.E97.D.1438},
  timestamp = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ieicet/NakamuraHNT14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEICE Trans. 2014 article: image recognition with separable lattice trajectory 2-D HMMs.
% "2-D" and the acronym are braced so sentence-casing styles keep their capitalization.
@article{DBLP:journals/ieicet/TamamoriNT14,
  author    = {Akira Tamamori and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Image Recognition Based on Separable Lattice Trajectory {2-D} {HMMs}},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {97-D},
  number    = {7},
  pages     = {1842--1854},
  year      = {2014},
  url       = {https://doi.org/10.1587/transinf.E97.D.1842},
  doi       = {10.1587/TRANSINF.E97.D.1842},
  timestamp = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ieicet/TamamoriNT14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEEE J-STSP 2014 article: contextual additive structure for HMM-based synthesis.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@article{DBLP:journals/jstsp/TakakiNT14,
  author    = {Shinji Takaki and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Contextual Additive Structure for {HMM}-Based Speech Synthesis},
  journal   = {{IEEE} J. Sel. Top. Signal Process.},
  volume    = {8},
  number    = {2},
  pages     = {229--238},
  year      = {2014},
  url       = {https://doi.org/10.1109/JSTSP.2014.2305919},
  doi       = {10.1109/JSTSP.2014.2305919},
  timestamp = {Thu, 09 Jul 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jstsp/TakakiNT14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2014 paper: HMM-based singing voice synthesis applied to Japanese and English.
% The acronym and language names are braced so sentence-casing styles keep their capitalization.
@inproceedings{DBLP:conf/icassp/NakamuraONT14,
  author    = {Kazuhiro Nakamura and
               Keiichiro Oura and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {{HMM}-Based singing voice synthesis and its application to {Japanese}
               and {English}},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
               {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages     = {265--269},
  publisher = {{IEEE}},
  year      = {2014},
  url       = {https://doi.org/10.1109/ICASSP.2014.6853599},
  doi       = {10.1109/ICASSP.2014.6853599},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/NakamuraONT14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2014 paper: speaker and pitch adaptive training for HMM-based singing voice synthesis.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/icassp/ShirotaNHONT14,
  author    = {Kanako Shirota and
               Kazuhiro Nakamura and
               Kei Hashimoto and
               Keiichiro Oura and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Integration of speaker and pitch adaptive training for {HMM}-based singing
               voice synthesis},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
               {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages     = {2559--2563},
  publisher = {{IEEE}},
  year      = {2014},
  url       = {https://doi.org/10.1109/ICASSP.2014.6854062},
  doi       = {10.1109/ICASSP.2014.6854062},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/ShirotaNHONT14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2014 paper: mel-cepstral analysis restoring high-frequency components.
@inproceedings{DBLP:conf/interspeech/NakamuraHONT14,
  author    = {Kazuhiro Nakamura and
               Kei Hashimoto and
               Keiichiro Oura and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  editor    = {Haizhou Li and
               Helen M. Meng and
               Bin Ma and
               Engsiong Chng and
               Lei Xie},
  title     = {A mel-cepstral analysis technique restoring high frequency components
               from low-sampling-rate speech},
  booktitle = {15th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2014, Singapore, September 14-18, 2014},
  pages     = {2494--2498},
  publisher = {{ISCA}},
  year      = {2014},
  url       = {https://doi.org/10.21437/Interspeech.2014-535},
  doi       = {10.21437/INTERSPEECH.2014-535},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/NakamuraHONT14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEICE Trans. 2013 article: Bayesian framework with multiple model structures for recognition.
% "Bayesian" is braced so sentence-casing styles keep its capitalization.
@article{DBLP:journals/ieicet/ShiotaHNT13,
  author    = {Sayaka Shiota and
               Kei Hashimoto and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {A {Bayesian} Framework Using Multiple Model Structures for Speech Recognition},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {96-D},
  number    = {4},
  pages     = {939--948},
  year      = {2013},
  url       = {https://doi.org/10.1587/transinf.E96.D.939},
  doi       = {10.1587/TRANSINF.E96.D.939},
  timestamp = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ieicet/ShiotaHNT13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proc. IEEE 2013 article: speech synthesis based on hidden Markov models.
% "Markov" is braced so sentence-casing styles keep its capitalization.
@article{DBLP:journals/pieee/TokudaNTZYO13,
  author    = {Keiichi Tokuda and
               Yoshihiko Nankaku and
               Tomoki Toda and
               Heiga Zen and
               Junichi Yamagishi and
               Keiichiro Oura},
  title     = {Speech Synthesis Based on Hidden {Markov} Models},
  journal   = {Proc. {IEEE}},
  volume    = {101},
  number    = {5},
  pages     = {1234--1252},
  year      = {2013},
  url       = {https://doi.org/10.1109/JPROC.2013.2251852},
  doi       = {10.1109/JPROC.2013.2251852},
  timestamp = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/pieee/TokudaNTZYO13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% APSIPA 2013 paper: image recognition with hidden Markov eigen-image models.
% "Markov" and "Bayesian" are braced so sentence-casing styles keep their capitalization.
@inproceedings{DBLP:conf/apsipa/SawadaHNT13,
  author    = {Kei Sawada and
               Kei Hashimoto and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Image recognition based on hidden {Markov} eigen-image models using
               variational {Bayesian} method},
  booktitle = {Asia-Pacific Signal and Information Processing Association Annual
               Summit and Conference, {APSIPA} 2013, Kaohsiung, Taiwan, October 29
               - November 1, 2013},
  pages     = {1--8},
  publisher = {{IEEE}},
  year      = {2013},
  url       = {https://doi.org/10.1109/APSIPA.2013.6694382},
  doi       = {10.1109/APSIPA.2013.6694382},
  timestamp = {Wed, 16 Oct 2019 14:14:55 +0200},
  biburl    = {https://dblp.org/rec/conf/apsipa/SawadaHNT13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2013 paper: separable lattice 2-D HMMs with state duration control.
% The plural acronym is spelled "HMMs" (lowercase s); it and "2-D" are braced against recasing.
@inproceedings{DBLP:conf/icassp/MakinoTHNT13,
  author    = {Takaya Makino and
               Shinji Takaki and
               Kei Hashimoto and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Separable lattice {2-D} {HMMs} introducing state duration control for
               recognition of images with various variations},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
               {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages     = {3203--3207},
  publisher = {{IEEE}},
  year      = {2013},
  url       = {https://doi.org/10.1109/ICASSP.2013.6638249},
  doi       = {10.1109/ICASSP.2013.6638249},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/MakinoTHNT13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2013 paper: image recognition with separable lattice trajectory 2-D HMMs.
% The plural acronym is spelled "HMMs" (lowercase s); it and "2-D" are braced against recasing.
@inproceedings{DBLP:conf/icassp/TamamoriNT13,
  author    = {Akira Tamamori and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Image recognition based on separable lattice trajectory {2-D} {HMMs}},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
               {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages     = {3467--3471},
  publisher = {{IEEE}},
  year      = {2013},
  url       = {https://doi.org/10.1109/ICASSP.2013.6638302},
  doi       = {10.1109/ICASSP.2013.6638302},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/TamamoriNT13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2013 paper: contextual partial additive structure for HMM-based synthesis.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/icassp/TakakiNT13,
  author    = {Shinji Takaki and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Contextual partial additive structure for {HMM}-based speech synthesis},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
               {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages     = {7878--7882},
  publisher = {{IEEE}},
  year      = {2013},
  url       = {https://doi.org/10.1109/ICASSP.2013.6639198},
  doi       = {10.1109/ICASSP.2013.6639198},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/TakakiNT13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2013 paper: integrating acoustic modeling and mel-cepstral analysis.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/icassp/NakamuraHNT13,
  author    = {Kazuhiro Nakamura and
               Kei Hashimoto and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Integration of acoustic modeling and mel-cepstral analysis for {HMM}-based
               speech synthesis},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
               {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages     = {7883--7887},
  publisher = {{IEEE}},
  year      = {2013},
  url       = {https://doi.org/10.1109/ICASSP.2013.6639199},
  doi       = {10.1109/ICASSP.2013.6639199},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/NakamuraHNT13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SSW 2013 paper: cross-lingual speaker adaptation via factor analysis on bilingual data.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/ssw/YoshimuraHONT13,
  author    = {Takenori Yoshimura and
               Kei Hashimoto and
               Keiichiro Oura and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Cross-lingual speaker adaptation based on factor analysis using bilingual
               speech data for {HMM}-based speech synthesis},
  booktitle = {The Eighth {ISCA} Tutorial and Research Workshop on Speech Synthesis,
               {SSW} 2013, Barcelona, Spain, August 31 - September 2, 2013},
  pages     = {297--302},
  publisher = {{ISCA}},
  year      = {2013},
  url       = {https://www.isca-archive.org/ssw\_2013/yoshimura13\_ssw.html},
  timestamp = {Fri, 02 Aug 2024 09:01:40 +0200},
  biburl    = {https://dblp.org/rec/conf/ssw/YoshimuraHONT13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEICE Trans. 2012 article: separable lattice 2-D HMMs extended to rotational variations.
% "2-D" and the acronym are braced so sentence-casing styles keep their capitalization.
@article{DBLP:journals/ieicet/TamamoriNT12,
  author    = {Akira Tamamori and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {An Extension of Separable Lattice {2-D} {HMMs} for Rotational Data Variations},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {95-D},
  number    = {8},
  pages     = {2074--2083},
  year      = {2012},
  url       = {https://doi.org/10.1587/transinf.E95.D.2074},
  doi       = {10.1587/TRANSINF.E95.D.2074},
  timestamp = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ieicet/TamamoriNT12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% 2012 journal article: product of experts for statistical parametric speech synthesis.
% The journal field names the title the DOI prefix (TASL) belongs to: IEEE Transactions on
% Audio, Speech, and Language Processing, abbreviated like the other journals in this file.
@article{DBLP:journals/taslp/ZenGNT12,
  author    = {Heiga Zen and
               Mark J. F. Gales and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Product of Experts for Statistical Parametric Speech Synthesis},
  journal   = {{IEEE} Trans. Audio Speech Lang. Process.},
  volume    = {20},
  number    = {3},
  pages     = {794--805},
  year      = {2012},
  url       = {https://doi.org/10.1109/TASL.2011.2165280},
  doi       = {10.1109/TASL.2011.2165280},
  timestamp = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/taslp/ZenGNT12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2012 paper: face recognition with separable lattice 2-D HMMs and variational Bayes.
% The plural acronym is spelled "HMMs" and "Bayesian" is capitalized; both, and "2-D",
% are braced so sentence-casing styles keep their capitalization.
@inproceedings{DBLP:conf/icassp/SawadaTHNT12,
  author    = {Kei Sawada and
               Akira Tamamori and
               Kei Hashimoto and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Face recognition based on separable lattice {2-D} {HMMs} using variational
               {Bayesian} method},
  booktitle = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
               Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages     = {2205--2208},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/ICASSP.2012.6288351},
  doi       = {10.1109/ICASSP.2012.6288351},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/SawadaTHNT12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2012 paper: face recognition with extended separable lattice 2-D HMMs.
% The plural acronym is spelled "HMMs" (lowercase s); it and "2-D" are braced against recasing.
@inproceedings{DBLP:conf/icassp/KumakiNT12,
  author    = {Keisuke Kumaki and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Face recognition based on extended separable lattice {2-D} {HMMs}},
  booktitle = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
               Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages     = {2209--2212},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/ICASSP.2012.6288352},
  doi       = {10.1109/ICASSP.2012.6288352},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/KumakiNT12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2012 paper: model structure integration in a Bayesian framework for recognition.
% "Bayesian" is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/icassp/ShiotaHNT12,
  author    = {Sayaka Shiota and
               Kei Hashimoto and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {A model structure integration based on a {Bayesian} framework for speech
               recognition},
  booktitle = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
               Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages     = {4813--4816},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/ICASSP.2012.6288996},
  doi       = {10.1109/ICASSP.2012.6288996},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/ShiotaHNT12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2012 paper: pitch adaptive training for HMM-based singing voice synthesis.
% The acronym is written in capitals and braced so styles cannot lowercase it.
@inproceedings{DBLP:conf/icassp/OuraMNT12,
  author    = {Keiichiro Oura and
               Ayami Mase and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Pitch adaptive training for {HMM}-based singing voice synthesis},
  booktitle = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
               Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages     = {5377--5380},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/ICASSP.2012.6289136},
  doi       = {10.1109/ICASSP.2012.6289136},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/OuraMNT12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2012 paper: cross-lingual speaker adaptation using perceptual characteristics.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/interspeech/OliveiraSNT12,
  author    = {Viviane de Franca Oliveira and
               Sayaka Shiota and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Cross-lingual Speaker Adaptation for {HMM}-based Speech Synthesis based
               on Perceptual Characteristics and Speaker Interpolation},
  booktitle = {13th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2012, Portland, Oregon, USA, September 9-13, 2012},
  pages     = {983--986},
  publisher = {{ISCA}},
  year      = {2012},
  url       = {https://doi.org/10.21437/Interspeech.2012-292},
  doi       = {10.21437/INTERSPEECH.2012-292},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/OliveiraSNT12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2012 paper: Bayesian speaker recognition with GMMs and multiple model structures.
% "Bayesian" and the acronym are braced so sentence-casing styles keep their capitalization.
@inproceedings{DBLP:conf/interspeech/HattoriHNT12,
  author    = {Takafumi Hattori and
               Kei Hashimoto and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {A {Bayesian} Approach to Speaker Recognition Based on {GMMs} Using Multiple
               Model Structures},
  booktitle = {13th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2012, Portland, Oregon, USA, September 9-13, 2012},
  pages     = {1107--1110},
  publisher = {{ISCA}},
  year      = {2012},
  url       = {https://doi.org/10.21437/Interspeech.2012-334},
  doi       = {10.21437/INTERSPEECH.2012-334},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/HattoriHNT12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEICE Trans. 2011 article: Bayesian context clustering with cross validation.
% "Bayesian" is braced so sentence-casing styles keep its capitalization.
@article{DBLP:journals/ieicet/HashimotoZNLT11,
  author    = {Kei Hashimoto and
               Heiga Zen and
               Yoshihiko Nankaku and
               Akinobu Lee and
               Keiichi Tokuda},
  title     = {{Bayesian} Context Clustering Using Cross Validation for Speech Recognition},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {94-D},
  number    = {3},
  pages     = {668--678},
  year      = {2011},
  url       = {https://doi.org/10.1587/transinf.E94.D.668},
  doi       = {10.1587/TRANSINF.E94.D.668},
  timestamp = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ieicet/HashimotoZNLT11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% 2011 journal article: continuous stochastic feature mapping based on trajectory HMMs.
% The journal field names the title the DOI prefix (TASL) belongs to: IEEE Transactions on
% Audio, Speech, and Language Processing. The title acronym is braced against recasing.
@article{DBLP:journals/taslp/ZenNT11,
  author    = {Heiga Zen and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Continuous Stochastic Feature Mapping Based on Trajectory {HMMs}},
  journal   = {{IEEE} Trans. Audio Speech Lang. Process.},
  volume    = {19},
  number    = {2},
  pages     = {417--430},
  year      = {2011},
  url       = {https://doi.org/10.1109/TASL.2010.2049685},
  doi       = {10.1109/TASL.2010.2049685},
  timestamp = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/taslp/ZenNT11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2011 paper: optimizing independent mean and variance parameter tying structures.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/icassp/TakakiONT11,
  author    = {Shinji Takaki and
               Keiichiro Oura and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {An optimization algorithm of independent mean and variance parameter
               tying structures for {HMM}-based speech synthesis},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
               and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress
               Center, Prague, Czech Republic},
  pages     = {4700--4703},
  publisher = {{IEEE}},
  year      = {2011},
  url       = {https://doi.org/10.1109/ICASSP.2011.5947404},
  doi       = {10.1109/ICASSP.2011.5947404},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/TakakiONT11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2011 paper: global variance modeling on frequency-domain delta LSP.
% The acronyms in the title are braced so sentence-casing styles keep their capitalization.
@inproceedings{DBLP:conf/icassp/PanNTT11,
  author    = {Shifeng Pan and
               Yoshihiko Nankaku and
               Keiichi Tokuda and
               Jianhua Tao},
  title     = {Global variance modeling on frequency domain delta {LSP} for {HMM}-based
               speech synthesis},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
               and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress
               Center, Prague, Czech Republic},
  pages     = {4716--4719},
  publisher = {{IEEE}},
  year      = {2011},
  url       = {https://doi.org/10.1109/ICASSP.2011.5947408},
  doi       = {10.1109/ICASSP.2011.5947408},
  timestamp = {Mon, 18 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/PanNTT11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2011 paper: multi-speaker modeling with shared priors for Bayesian synthesis.
% "Bayesian" is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/interspeech/HashimotoNT11,
  author    = {Kei Hashimoto and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Multi-Speaker Modeling with Shared Prior Distributions and Model Structures
               for {Bayesian} Speech Synthesis},
  booktitle = {12th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2011, Florence, Italy, August 27-31, 2011},
  pages     = {113--116},
  publisher = {{ISCA}},
  year      = {2011},
  url       = {https://doi.org/10.21437/Interspeech.2011-29},
  doi       = {10.21437/INTERSPEECH.2011-29},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/HashimotoNT11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2011 paper: Bayesian voice conversion with GMMs and multiple model structures.
% "Bayesian" and the acronym are braced so sentence-casing styles keep their capitalization.
@inproceedings{DBLP:conf/interspeech/LiNT11,
  author    = {Lei Li and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {A {Bayesian} Approach to Voice Conversion Based on {GMMs} Using Multiple
               Model Structures},
  booktitle = {12th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2011, Florence, Italy, August 27-31, 2011},
  pages     = {661--664},
  publisher = {{ISCA}},
  year      = {2011},
  url       = {https://doi.org/10.21437/Interspeech.2011-270},
  doi       = {10.21437/INTERSPEECH.2011-270},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/LiNT11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2011 paper: GMM-based missing-feature reconstruction on multi-frame windows.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/interspeech/RemesNT11,
  author    = {Ulpu Remes and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {{GMM}-Based Missing-Feature Reconstruction on Multi-Frame Windows},
  booktitle = {12th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2011, Florence, Italy, August 27-31, 2011},
  pages     = {1665--1668},
  publisher = {{ISCA}},
  year      = {2011},
  url       = {https://doi.org/10.21437/Interspeech.2011-214},
  doi       = {10.21437/INTERSPEECH.2011-214},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/RemesNT11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2011 paper: estimating window coefficients for dynamic feature extraction.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/interspeech/ChenNZTLD11,
  author    = {Ling{-}Hui Chen and
               Yoshihiko Nankaku and
               Heiga Zen and
               Keiichi Tokuda and
               Zhen{-}Hua Ling and
               Li{-}Rong Dai},
  title     = {Estimation of Window Coefficients for Dynamic Feature Extraction for
               {HMM}-Based Speech Synthesis},
  booktitle = {12th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2011, Florence, Italy, August 27-31, 2011},
  pages     = {1801--1804},
  publisher = {{ISCA}},
  year      = {2011},
  url       = {https://doi.org/10.21437/Interspeech.2011-33},
  doi       = {10.21437/INTERSPEECH.2011-33},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ChenNZTLD11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2011 paper: evaluating tree-trellis based decoding in over-million LVCSR.
@inproceedings{DBLP:conf/interspeech/ItoNL11,
  author    = {Naoaki Ito and
               Yoshihiko Nankaku and
               Akinobu Lee},
  title     = {Evaluation of Tree-Trellis Based Decoding in Over-Million {LVCSR}},
  booktitle = {12th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2011, Florence, Italy, August 27-31, 2011},
  pages     = {1937--1940},
  publisher = {{ISCA}},
  year      = {2011},
  url       = {https://doi.org/10.21437/Interspeech.2011-362},
  doi       = {10.21437/INTERSPEECH.2011-362},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ItoNL11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEICE Trans. 2010 article: covariance-tying technique for HMM-based speech synthesis.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@article{DBLP:journals/ieicet/OuraZNLT10,
  author    = {Keiichiro Oura and
               Heiga Zen and
               Yoshihiko Nankaku and
               Akinobu Lee and
               Keiichi Tokuda},
  title     = {A Covariance-Tying Technique for {HMM}-Based Speech Synthesis},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {93-D},
  number    = {3},
  pages     = {595--601},
  year      = {2010},
  url       = {https://doi.org/10.1587/transinf.E93.D.595},
  doi       = {10.1587/TRANSINF.E93.D.595},
  timestamp = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ieicet/OuraZNLT10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% EAMT 2010 paper: deterministic annealing-based training for statistical MT models.
% NOTE(review): this record carries no pages field; confirm against the ACL Anthology page.
@inproceedings{DBLP:conf/eamt/Martinez-GomezH10,
  author    = {Pascual Mart{\'{\i}}nez{-}G{\'{o}}mez and
               Kei Hashimoto and
               Yoshihiko Nankaku and
               Keiichi Tokuda and
               Germ{\'{a}}n Sanchis{-}Trilles},
  editor    = {Fran{\c{c}}ois Yvon and
               Viggo Hansen},
  title     = {A Deterministic Annealing-Based Training Algorithm For Statistical
               Machine Translation Models},
  booktitle = {Proceedings of the 14th Annual conference of the European Association
               for Machine Translation, {EAMT} 2010, Saint Rapha{\"{e}}l, France,
               May 27-28, 2010},
  publisher = {European Association for Machine Translation},
  year      = {2010},
  url       = {https://aclanthology.org/2010.eamt-1.20/},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/eamt/Martinez-GomezH10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2010 paper: face recognition with separable lattice 2-D HMM and duration modeling.
% "2-D" is braced alongside the acronym so sentence-casing styles do not lowercase the D.
@inproceedings{DBLP:conf/icassp/TakahashiTNT10,
  author    = {Yoshiaki Takahashi and
               Akira Tamamori and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Face recognition based on separable lattice {2-D} {HMM} with state duration
               modeling},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
               and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
               Hotel, Dallas, Texas, {USA}},
  pages     = {2162--2165},
  publisher = {{IEEE}},
  year      = {2010},
  url       = {https://doi.org/10.1109/ICASSP.2010.5495625},
  doi       = {10.1109/ICASSP.2010.5495625},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/TakahashiTNT10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2010 paper: separable lattice 2-D HMMs extended to rotational data variations.
% The plural acronym is spelled "HMMs" (lowercase s); it and "2-D" are braced against recasing.
@inproceedings{DBLP:conf/icassp/TamamoriNT10,
  author    = {Akira Tamamori and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {An extension of Separable Lattice {2-D} {HMMs} for rotational data variations},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
               and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
               Hotel, Dallas, Texas, {USA}},
  pages     = {2206--2209},
  publisher = {{IEEE}},
  year      = {2010},
  url       = {https://doi.org/10.1109/ICASSP.2010.5495735},
  doi       = {10.1109/ICASSP.2010.5495735},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/TamamoriNT10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2010 paper: factor analyzed voice models for HMM-based speech synthesis.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/icassp/KazumiNT10,
  author    = {Kyosuke Kazumi and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Factor analyzed voice models for {HMM}-based speech synthesis},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
               and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
               Hotel, Dallas, Texas, {USA}},
  pages     = {4234--4237},
  publisher = {{IEEE}},
  year      = {2010},
  url       = {https://doi.org/10.1109/ICASSP.2010.5495689},
  doi       = {10.1109/ICASSP.2010.5495689},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/KazumiNT10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2010 paper: statistical parametric speech synthesis based on product of experts.
@inproceedings{DBLP:conf/icassp/ZenGNT10,
  author    = {Heiga Zen and
               Mark J. F. Gales and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  title     = {Statistical parametric speech synthesis based on product of experts},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
               and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
               Hotel, Dallas, Texas, {USA}},
  pages     = {4242--4245},
  publisher = {{IEEE}},
  year      = {2010},
  url       = {https://doi.org/10.1109/ICASSP.2010.5495691},
  doi       = {10.1109/ICASSP.2010.5495691},
  timestamp = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/ZenGNT10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2010 paper: speaker adaptation via nonlinear spectral transform.
@inproceedings{DBLP:conf/interspeech/HayashiNLT10,
  author    = {Toyohiro Hayashi and
               Yoshihiko Nankaku and
               Akinobu Lee and
               Keiichi Tokuda},
  editor    = {Takao Kobayashi and
               Keikichi Hirose and
               Satoshi Nakamura},
  title     = {Speaker adaptation based on nonlinear spectral transform for speech
               recognition},
  booktitle = {11th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2010, Makuhari, Chiba, Japan, September 26-30, 2010},
  pages     = {542--545},
  publisher = {{ISCA}},
  year      = {2010},
  url       = {https://doi.org/10.21437/Interspeech.2010-218},
  doi       = {10.21437/INTERSPEECH.2010-218},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/HayashiNLT10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2010 paper: singing voice synthesis using pitch-shifted pseudo training data.
% The acronym in the title is braced so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/interspeech/MaseONT10,
  author    = {Ayami Mase and
               Keiichiro Oura and
               Yoshihiko Nankaku and
               Keiichi Tokuda},
  editor    = {Takao Kobayashi and
               Keikichi Hirose and
               Satoshi Nakamura},
  title     = {{HMM}-based singing voice synthesis system using pitch-shifted pseudo
               training data},
  booktitle = {11th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2010, Makuhari, Chiba, Japan, September 26-30, 2010},
  pages     = {845--848},
  publisher = {{ISCA}},
  year      = {2010},
  url       = {https://doi.org/10.21437/Interspeech.2010-188},
  doi       = {10.21437/INTERSPEECH.2010-188},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/MaseONT10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2010 paper: voice activity detection with conditional random fields.
@inproceedings{DBLP:conf/interspeech/SaitoNLT10,
  author    = {Akira Saito and
               Yoshihiko Nankaku and
               Akinobu Lee and
               Keiichi Tokuda},
  editor    = {Takao Kobayashi and
               Keikichi Hirose and
               Satoshi Nakamura},
  title     = {Voice activity detection based on conditional random fields using
               multiple features},
  booktitle = {11th Annual Conference of the International Speech Communication Association,
               {INTERSPEECH} 2010, Makuhari, Chiba, Japan, September 26-30, 2010},
  pages     = {2086--2089},
  publisher = {{ISCA}},
  year      = {2010},
  url       = {https://doi.org/10.21437/Interspeech.2010-588},
  doi       = {10.21437/INTERSPEECH.2010-588},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/SaitoNLT10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SSW 2010 paper. HMM is brace-protected so sentence-casing styles keep the acronym upper-case.
@inproceedings{DBLP:conf/ssw/TakakiNT10,
  author    = {Takaki, Shinji and Nankaku, Yoshihiko and Tokuda, Keiichi},
  editor    = {Sagisaka, Yoshinori and Tokuda, Keiichi},
  title     = {Spectral modeling with contextual additive structure for {HMM}-based speech synthesis},
  booktitle = {The Seventh {ISCA} Tutorial and Research Workshop on Speech Synthesis, {SSW} 2010, Kyoto, Japan, September 22-24, 2010},
  pages     = {100--105},
  publisher = {{ISCA}},
  year      = {2010},
  url       = {https://www.isca-archive.org/ssw\_2010/takaki10\_ssw.html},
  timestamp = {Fri, 02 Aug 2024 09:01:35 +0200},
  biburl    = {https://dblp.org/rec/conf/ssw/TakakiNT10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SSW 2010 paper by Hashimoto, Nankaku and Tokuda (names stored in "Last, First" form).
@inproceedings{DBLP:conf/ssw/HashimotoNT10,
  author    = {Hashimoto, Kei and Nankaku, Yoshihiko and Tokuda, Keiichi},
  editor    = {Sagisaka, Yoshinori and Tokuda, Keiichi},
  title     = {Bayesian speech synthesis framework integrating training and synthesis processes},
  booktitle = {The Seventh {ISCA} Tutorial and Research Workshop on Speech Synthesis, {SSW} 2010, Kyoto, Japan, September 22-24, 2010},
  pages     = {106--111},
  publisher = {{ISCA}},
  year      = {2010},
  url       = {https://www.isca-archive.org/ssw\_2010/hashimoto10\_ssw.html},
  timestamp = {Wed, 31 Jul 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ssw/HashimotoNT10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SSW 2010 paper. HMM and the system name Sinsy are brace-protected against sentence casing;
% the spaced hyphen before the system name is written as a TeX em dash.
@inproceedings{DBLP:conf/ssw/OuraMYMNT10,
  author    = {Oura, Keiichiro and Mase, Ayami and Yamada, Tomohiko and Muto, Satoru and Nankaku, Yoshihiko and Tokuda, Keiichi},
  editor    = {Sagisaka, Yoshinori and Tokuda, Keiichi},
  title     = {Recent development of the {HMM}-based singing voice synthesis system --- {Sinsy}},
  booktitle = {The Seventh {ISCA} Tutorial and Research Workshop on Speech Synthesis, {SSW} 2010, Kyoto, Japan, September 22-24, 2010},
  pages     = {211--216},
  publisher = {{ISCA}},
  year      = {2010},
  url       = {https://www.isca-archive.org/ssw\_2010/oura10\_ssw.html},
  timestamp = {Wed, 31 Jul 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ssw/OuraMYMNT10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2009 paper by Yutani, Uto, Nankaku, Lee and Tokuda (names stored in "Last, First" form).
@inproceedings{DBLP:conf/icassp/YutaniUNLT09,
  author    = {Yutani, Kaori and Uto, Yosuke and Nankaku, Yoshihiko and Lee, Akinobu and Tokuda, Keiichi},
  title     = {Voice conversion based on simultaneous modelling of spectrum and {F0}},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages     = {3897--3900},
  publisher = {{IEEE}},
  year      = {2009},
  url       = {https://doi.org/10.1109/ICASSP.2009.4960479},
  doi       = {10.1109/ICASSP.2009.4960479},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/YutaniUNLT09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2009 paper. Bayesian and HMM are brace-protected so sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/icassp/HashimotoZNMT09,
  author    = {Hashimoto, Kei and Zen, Heiga and Nankaku, Yoshihiko and Masuko, Takashi and Tokuda, Keiichi},
  title     = {A {Bayesian} approach to {HMM}-based speech synthesis},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages     = {4029--4032},
  publisher = {{IEEE}},
  year      = {2009},
  url       = {https://doi.org/10.1109/ICASSP.2009.4960512},
  doi       = {10.1109/ICASSP.2009.4960512},
  timestamp = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/HashimotoZNMT09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2009 paper. The plural acronym is written GMMs (lower-case plural s) and kept brace-protected.
@inproceedings{DBLP:conf/icassp/ZenNT09,
  author    = {Zen, Heiga and Nankaku, Yoshihiko and Tokuda, Keiichi},
  title     = {Stereo-based stochastic noise compensation based on trajectory {GMMs}},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages     = {4577--4580},
  publisher = {{IEEE}},
  year      = {2009},
  url       = {https://doi.org/10.1109/ICASSP.2009.4960649},
  doi       = {10.1109/ICASSP.2009.4960649},
  timestamp = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/ZenNT09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH 2009 paper. HMM is brace-protected so sentence-casing styles keep the acronym upper-case.
@inproceedings{DBLP:conf/interspeech/WuNT09,
  author    = {Wu, Yi{-}Jian and Nankaku, Yoshihiko and Tokuda, Keiichi},
  title     = {State mapping based method for cross-lingual speaker adaptation in {HMM}-based speech synthesis},
  booktitle = {10th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2009, Brighton, United Kingdom, September 6-10, 2009},
  pages     = {528--531},
  publisher = {{ISCA}},
  year      = {2009},
  url       = {https://doi.org/10.21437/Interspeech.2009-192},
  doi       = {10.21437/INTERSPEECH.2009-192},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/WuNT09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH 2009 paper. Bayesian is brace-protected so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/interspeech/ShiotaHNT09,
  author    = {Shiota, Sayaka and Hashimoto, Kei and Nankaku, Yoshihiko and Tokuda, Keiichi},
  title     = {Deterministic annealing based training algorithm for {Bayesian} speech recognition},
  booktitle = {10th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2009, Brighton, United Kingdom, September 6-10, 2009},
  pages     = {680--683},
  publisher = {{ISCA}},
  year      = {2009},
  url       = {https://doi.org/10.21437/Interspeech.2009-236},
  doi       = {10.21437/INTERSPEECH.2009-236},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ShiotaHNT09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH 2009 paper. The proper names Bayesian and Markov are brace-protected against sentence casing.
@inproceedings{DBLP:conf/interspeech/HashimotoNT09,
  author    = {Hashimoto, Kei and Nankaku, Yoshihiko and Tokuda, Keiichi},
  title     = {A {Bayesian} approach to Hidden Semi-{Markov} Model based speech synthesis},
  booktitle = {10th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2009, Brighton, United Kingdom, September 6-10, 2009},
  pages     = {1751--1754},
  publisher = {{ISCA}},
  year      = {2009},
  url       = {https://doi.org/10.21437/Interspeech.2009-141},
  doi       = {10.21437/INTERSPEECH.2009-141},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/HashimotoNT09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH 2009 paper. HMM is brace-protected so sentence-casing styles keep the acronym upper-case.
@inproceedings{DBLP:conf/interspeech/OuraZNLT09,
  author    = {Oura, Keiichiro and Zen, Heiga and Nankaku, Yoshihiko and Lee, Akinobu and Tokuda, Keiichi},
  title     = {Tying covariance matrices to reduce the footprint of {HMM}-based speech synthesis systems},
  booktitle = {10th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2009, Brighton, United Kingdom, September 6-10, 2009},
  pages     = {1759--1762},
  publisher = {{ISCA}},
  year      = {2009},
  url       = {https://doi.org/10.21437/Interspeech.2009-143},
  doi       = {10.21437/INTERSPEECH.2009-143},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/OuraZNLT09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEICE Trans. Inf. Syst. article (2008). The proper name Markov is brace-protected against sentence casing.
@article{DBLP:journals/ieicet/OuraZNLT08,
  author    = {Oura, Keiichiro and Zen, Heiga and Nankaku, Yoshihiko and Lee, Akinobu and Tokuda, Keiichi},
  title     = {A Fully Consistent Hidden Semi-{Markov} Model-Based Speech Recognition System},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {91-D},
  number    = {11},
  pages     = {2693--2700},
  year      = {2008},
  url       = {https://doi.org/10.1093/ietisy/e91-d.11.2693},
  doi       = {10.1093/IETISY/E91-D.11.2693},
  timestamp = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ieicet/OuraZNLT08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2008 paper. HMM is brace-protected so sentence-casing styles keep the acronym upper-case.
@inproceedings{DBLP:conf/icassp/NankakuNZT08,
  author    = {Nankaku, Yoshihiko and Nakamura, Kazuhiro and Zen, Heiga and Tokuda, Keiichi},
  title     = {Acoustic modeling with contextual additive structure for {HMM}-based speech recognition},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2008, March 30 - April 4, 2008, Caesars Palace, Las Vegas, Nevada, {USA}},
  pages     = {4469--4472},
  publisher = {{IEEE}},
  year      = {2008},
  url       = {https://doi.org/10.1109/ICASSP.2008.4518648},
  doi       = {10.1109/ICASSP.2008.4518648},
  timestamp = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/NankakuNZT08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH 2008 paper by Yoshimi, Kakitsuba, Nankaku, Lee and Tokuda (names stored in "Last, First" form).
@inproceedings{DBLP:conf/interspeech/YoshimiKNLT08,
  author    = {Yoshimi, Yoshitaka and Kakitsuba, Ryota and Nankaku, Yoshihiko and Lee, Akinobu and Tokuda, Keiichi},
  title     = {Probabilistic answer selection based on conditional random fields for spoken dialog system},
  booktitle = {9th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages     = {215--218},
  publisher = {{ISCA}},
  year      = {2008},
  url       = {https://doi.org/10.21437/Interspeech.2008-67},
  doi       = {10.21437/INTERSPEECH.2008-67},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/YoshimiKNLT08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH 2008 paper by Shiota, Hashimoto, Zen, Nankaku, Lee and Tokuda (names stored in "Last, First" form).
@inproceedings{DBLP:conf/interspeech/ShiotaHZNLT08,
  author    = {Shiota, Sayaka and Hashimoto, Kei and Zen, Heiga and Nankaku, Yoshihiko and Lee, Akinobu and Tokuda, Keiichi},
  title     = {Acoustic modeling based on model structure annealing for speech recognition},
  booktitle = {9th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages     = {932--935},
  publisher = {{ISCA}},
  year      = {2008},
  url       = {https://doi.org/10.21437/Interspeech.2008-111},
  doi       = {10.21437/INTERSPEECH.2008-111},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ShiotaHZNLT08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH 2008 paper. HMM is brace-protected so sentence-casing styles keep the acronym upper-case.
@inproceedings{DBLP:conf/interspeech/HashimotoZNLT08,
  author    = {Hashimoto, Kei and Zen, Heiga and Nankaku, Yoshihiko and Lee, Akinobu and Tokuda, Keiichi},
  title     = {Bayesian context clustering using cross valid prior distribution for {HMM}-based speech recognition},
  booktitle = {9th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages     = {936--939},
  publisher = {{ISCA}},
  year      = {2008},
  url       = {https://doi.org/10.21437/Interspeech.2008-112},
  doi       = {10.21437/INTERSPEECH.2008-112},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/HashimotoZNLT08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH 2008 paper. HMMs is brace-protected so sentence-casing styles keep the acronym upper-case.
@inproceedings{DBLP:conf/interspeech/ZenNT08,
  author    = {Zen, Heiga and Nankaku, Yoshihiko and Tokuda, Keiichi},
  title     = {Probabilistic feature mapping based on trajectory {HMMs}},
  booktitle = {9th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages     = {1068--1071},
  publisher = {{ISCA}},
  year      = {2008},
  url       = {https://doi.org/10.21437/Interspeech.2008-330},
  doi       = {10.21437/INTERSPEECH.2008-330},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ZenNT08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH 2008 paper by Yutani, Uto, Nankaku, Toda and Tokuda (names stored in "Last, First" form).
@inproceedings{DBLP:conf/interspeech/YutaniUNTT08,
  author    = {Yutani, Kaori and Uto, Yosuke and Nankaku, Yoshihiko and Toda, Tomoki and Tokuda, Keiichi},
  title     = {Simultaneous conversion of duration and spectrum based on statistical models including time-sequence matching},
  booktitle = {9th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages     = {1072--1075},
  publisher = {{ISCA}},
  year      = {2008},
  url       = {https://doi.org/10.21437/Interspeech.2008-331},
  doi       = {10.21437/INTERSPEECH.2008-331},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/YutaniUNTT08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH 2008 paper. Bayesian is brace-protected so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/interspeech/ItoHNLT08,
  author    = {Ito, Tatsuya and Hashimoto, Kei and Nankaku, Yoshihiko and Lee, Akinobu and Tokuda, Keiichi},
  title     = {Speaker recognition based on variational {Bayesian} method},
  booktitle = {9th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages     = {1417--1420},
  publisher = {{ISCA}},
  year      = {2008},
  url       = {https://doi.org/10.21437/Interspeech.2008-410},
  doi       = {10.21437/INTERSPEECH.2008-410},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ItoHNLT08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ISCSLP 2008 paper. The acronym TTS is restored to upper case (it was "TTs") and brace-protected.
@inproceedings{DBLP:conf/iscslp/OuraNTTMSN08,
  author    = {Oura, Keiichiro and Nankaku, Yoshihiko and Toda, Tomoki and Tokuda, Keiichi and Maia, Ranniery and Sakai, Shinsuke and Nakamura, Satoshi},
  editor    = {Meng, Helen M. and Jiang, Hui and Tao, Jianhua and Wang, Ren{-}Hua},
  title     = {Simultaneous Acoustic, Prosodic, and Phrasing Model Training for {TTS} Conversion Systems},
  booktitle = {6th International Symposium on Chinese Spoken Language Processing, {ISCSLP} 2008, 16-19 December, 2008, Kunming, China},
  pages     = {1--4},
  publisher = {{IEEE}},
  year      = {2008},
  url       = {https://doi.org/10.1109/CHINSL.2008.ECP.12},
  doi       = {10.1109/CHINSL.2008.ECP.12},
  timestamp = {Wed, 18 Sep 2024 12:50:19 +0200},
  biburl    = {https://dblp.org/rec/conf/iscslp/OuraNTTMSN08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2007 paper. The proper name Markov is brace-protected against sentence casing.
@inproceedings{DBLP:conf/icassp/NankakuT07,
  author    = {Nankaku, Yoshihiko and Tokuda, Keiichi},
  title     = {Face Recognition using Hidden {Markov} Eigenface Models},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2007, Honolulu, Hawaii, USA, April 15-20, 2007},
  pages     = {469--472},
  publisher = {{IEEE}},
  year      = {2007},
  url       = {https://doi.org/10.1109/ICASSP.2007.366274},
  doi       = {10.1109/ICASSP.2007.366274},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/NankakuT07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH 2007 paper. HMM is brace-protected so sentence-casing styles keep the acronym upper-case.
@inproceedings{DBLP:conf/interspeech/MaiaTZNT07,
  author    = {Maia, Ranniery and Toda, Tomoki and Zen, Heiga and Nankaku, Yoshihiko and Tokuda, Keiichi},
  title     = {A trainable excitation model for {HMM}-based speech synthesis},
  booktitle = {8th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2007, Antwerp, Belgium, August 27-31, 2007},
  pages     = {1909--1912},
  publisher = {{ISCA}},
  year      = {2007},
  url       = {https://doi.org/10.21437/Interspeech.2007-530},
  doi       = {10.21437/INTERSPEECH.2007-530},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/MaiaTZNT07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH 2007 paper. HMMs is brace-protected (as MLLR already was) against sentence casing.
@inproceedings{DBLP:conf/interspeech/ZenNT07,
  author    = {Zen, Heiga and Nankaku, Yoshihiko and Tokuda, Keiichi},
  title     = {Model-space {MLLR} for trajectory {HMMs}},
  booktitle = {8th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2007, Antwerp, Belgium, August 27-31, 2007},
  pages     = {2065--2068},
  publisher = {{ISCA}},
  year      = {2007},
  url       = {https://doi.org/10.21437/Interspeech.2007-559},
  doi       = {10.21437/INTERSPEECH.2007-559},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ZenNT07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SSW 2007 paper. HMM is brace-protected so sentence-casing styles keep the acronym upper-case.
@inproceedings{DBLP:conf/ssw/MaiaTZNT07,
  author    = {Maia, Ranniery and Toda, Tomoki and Zen, Heiga and Nankaku, Yoshihiko and Tokuda, Keiichi},
  editor    = {Wagner, Petra and Abresch, Julia and Breuer, Stefan and Hess, Wolfgang},
  title     = {An excitation model for {HMM}-based speech synthesis based on residual modeling},
  booktitle = {Sixth {ISCA} Workshop on Speech Synthesis, {SSW} 2007, Bonn, Germany, August 22-24, 2007},
  pages     = {131--136},
  publisher = {{ISCA}},
  year      = {2007},
  url       = {https://www.isca-archive.org/ssw\_2007/maia07\_ssw.html},
  timestamp = {Fri, 02 Aug 2024 09:01:26 +0200},
  biburl    = {https://dblp.org/rec/conf/ssw/MaiaTZNT07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SSW 2007 paper by Nankaku, Nakamura, Toda and Tokuda (names stored in "Last, First" form).
@inproceedings{DBLP:conf/ssw/NankakuNTT07,
  author    = {Nankaku, Yoshihiko and Nakamura, Kenichi and Toda, Tomoki and Tokuda, Keiichi},
  editor    = {Wagner, Petra and Abresch, Julia and Breuer, Stefan and Hess, Wolfgang},
  title     = {Spectral conversion based on statistical models including time-sequence matching},
  booktitle = {Sixth {ISCA} Workshop on Speech Synthesis, {SSW} 2007, Bonn, Germany, August 22-24, 2007},
  pages     = {333--338},
  publisher = {{ISCA}},
  year      = {2007},
  url       = {https://www.isca-archive.org/ssw\_2007/nankaku07\_ssw.html},
  timestamp = {Wed, 31 Jul 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ssw/NankakuNTT07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2006 paper. The proper name Markov is brace-protected against sentence casing.
@inproceedings{DBLP:conf/icassp/OuraZNLT06,
  author    = {Oura, Keiichiro and Zen, Heiga and Nankaku, Yoshihiko and Lee, Akinobu and Tokuda, Keiichi},
  title     = {Hidden Semi-{Markov} Model Based Speech Recognition System using Weighted Finite-State Transducer},
  booktitle = {2006 {IEEE} International Conference on Acoustics Speech and Signal Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages     = {33--36},
  publisher = {{IEEE}},
  year      = {2006},
  url       = {https://doi.org/10.1109/ICASSP.2006.1659950},
  doi       = {10.1109/ICASSP.2006.1659950},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/OuraZNLT06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2006 paper by Nakamura, Toda, Nankaku and Tokuda (names stored in "Last, First" form).
@inproceedings{DBLP:conf/icassp/NakamuraTNT06,
  author    = {Nakamura, Kenichi and Toda, Tomoki and Nankaku, Yoshihiko and Tokuda, Keiichi},
  title     = {On the Use of Phonetic Information for Mapping from Articulatory Movements to Vocal Tract Spectrum},
  booktitle = {2006 {IEEE} International Conference on Acoustics Speech and Signal Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages     = {93--96},
  publisher = {{IEEE}},
  year      = {2006},
  url       = {https://doi.org/10.1109/ICASSP.2006.1659965},
  doi       = {10.1109/ICASSP.2006.1659965},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/NakamuraTNT06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2006 paper. The plural acronym is written HMMs (lower-case plural s) and kept brace-protected.
@inproceedings{DBLP:conf/icassp/KurataNTKG06,
  author    = {Kurata, Daisuke and Nankaku, Yoshihiko and Tokuda, Keiichi and Kitamura, Tadashi and Ghahramani, Zoubin},
  title     = {Face Recognition Based on Separable Lattice {HMMs}},
  booktitle = {2006 {IEEE} International Conference on Acoustics Speech and Signal Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages     = {737--740},
  publisher = {{IEEE}},
  year      = {2006},
  url       = {https://doi.org/10.1109/ICASSP.2006.1661381},
  doi       = {10.1109/ICASSP.2006.1661381},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/KurataNTKG06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2006 paper. The acronyms HMM and EM are restored to upper case (they were "Hmm" and "Em"),
% and they and the proper names Monte Carlo and Gibbs are brace-protected against sentence casing.
@inproceedings{DBLP:conf/icassp/ZenNTK06,
  author    = {Zen, Heiga and Nankaku, Yoshihiko and Tokuda, Keiichi and Kitamura, Tadashi},
  title     = {Estimating Trajectory {HMM} Parameters Using {Monte Carlo} {EM} With {Gibbs} Sampler},
  booktitle = {2006 {IEEE} International Conference on Acoustics Speech and Signal Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages     = {1173--1176},
  publisher = {{IEEE}},
  year      = {2006},
  url       = {https://doi.org/10.1109/ICASSP.2006.1660235},
  doi       = {10.1109/ICASSP.2006.1660235},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/ZenNTK06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH-ICSLP 2006 paper by Hakamata, Lee, Nankaku and Tokuda. This record carries no pages field.
@inproceedings{DBLP:conf/interspeech/HakamataLNT06,
  author    = {Hakamata, Tomohiro and Lee, Akinobu and Nankaku, Yoshihiko and Tokuda, Keiichi},
  title     = {Reducing computation on parallel decoding using frame-wise confidence scores},
  booktitle = {Ninth International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP} 2006, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher = {{ISCA}},
  year      = {2006},
  url       = {https://doi.org/10.21437/Interspeech.2006-457},
  doi       = {10.21437/INTERSPEECH.2006-457},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/HakamataLNT06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH-ICSLP 2006 paper. HMM is brace-protected so sentence-casing styles keep the acronym upper-case.
% This record carries no pages field.
@inproceedings{DBLP:conf/interspeech/SainoZNLT06,
  author    = {Saino, Keijiro and Zen, Heiga and Nankaku, Yoshihiko and Lee, Akinobu and Tokuda, Keiichi},
  title     = {An {HMM}-based singing voice synthesis system},
  booktitle = {Ninth International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP} 2006, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher = {{ISCA}},
  year      = {2006},
  url       = {https://doi.org/10.21437/Interspeech.2006-584},
  doi       = {10.21437/INTERSPEECH.2006-584},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/SainoZNLT06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH-ICSLP 2006 paper by Uto, Nankaku, Toda, Lee and Tokuda. This record carries no pages field.
@inproceedings{DBLP:conf/interspeech/UtoNTLT06,
  author    = {Uto, Yosuke and Nankaku, Yoshihiko and Toda, Tomoki and Lee, Akinobu and Tokuda, Keiichi},
  title     = {Voice conversion based on mixtures of factor analyzers},
  booktitle = {Ninth International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP} 2006, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher = {{ISCA}},
  year      = {2006},
  url       = {https://doi.org/10.21437/Interspeech.2006-585},
  doi       = {10.21437/INTERSPEECH.2006-585},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/UtoNTLT06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH-ICSLP 2006 paper. HMMs is brace-protected (as MLLR already was) against sentence casing.
% This record carries no pages field.
@inproceedings{DBLP:conf/interspeech/ZenNTK06,
  author    = {Zen, Heiga and Nankaku, Yoshihiko and Tokuda, Keiichi and Kitamura, Tadashi},
  title     = {Speaker adaptation of trajectory {HMMs} using feature-space {MLLR}},
  booktitle = {Ninth International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP} 2006, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher = {{ISCA}},
  year      = {2006},
  url       = {https://doi.org/10.21437/Interspeech.2006-348},
  doi       = {10.21437/INTERSPEECH.2006-348},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ZenNTK06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEICE Trans. Inf. Syst. article (2005). The URL query separators were double-encoded as the HTML
% entity for an ampersand (number 38); they are restored to plain escaped ampersands.
@article{DBLP:journals/ieicet/LimaZNTKR05,
  author    = {de Lima, Amaro A. and Zen, Heiga and Nankaku, Yoshihiko and Tokuda, Keiichi and Kitamura, Tadashi and Resende, Fernando Gil},
  title     = {Applying Sparse {KPCA} for Feature Extraction in Speech Recognition},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {88-D},
  number    = {3},
  pages     = {401--409},
  year      = {2005},
  url       = {http://search.ieice.org/bin/summary.php?id=e88-d\_3\_401\&category=D\&year=2005\&lang=E\&abst=},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ieicet/LimaZNTKR05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEICE Trans. Inf. Syst. article (2005). The URL query separators were double-encoded as the HTML
% entity for an ampersand (number 38); they are restored to plain escaped ampersands.
@article{DBLP:journals/ieicet/SuzukiZNMTK05,
  author    = {Suzuki, Hiroyuki and Zen, Heiga and Nankaku, Yoshihiko and Miyajima, Chiyomi and Tokuda, Keiichi and Kitamura, Tadashi},
  title     = {Continuous Speech Recognition Based on General Factor Dependent Acoustic Models},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {88-D},
  number    = {3},
  pages     = {410--417},
  year      = {2005},
  url       = {http://search.ieice.org/bin/summary.php?id=e88-d\_3\_410\&category=D\&year=2005\&lang=E\&abst=},
  timestamp = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ieicet/SuzukiZNMTK05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEICE Trans. Inf. Syst. article (2005). The URL query separators were double-encoded as the HTML
% entity for an ampersand (number 38); they are restored to plain escaped ampersands.
@article{DBLP:journals/ieicet/YamamotoNMTK05,
  author    = {Yamamoto, Hiroyoshi and Nankaku, Yoshihiko and Miyajima, Chiyomi and Tokuda, Keiichi and Kitamura, Tadashi},
  title     = {Parameter Sharing in Mixture of Factor Analyzers for Speaker Identification},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {88-D},
  number    = {3},
  pages     = {418--424},
  year      = {2005},
  url       = {http://search.ieice.org/bin/summary.php?id=e88-d\_3\_418\&category=D\&year=2005\&lang=E\&abst=},
  timestamp = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ieicet/YamamotoNMTK05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEICE Trans. Inf. Syst. article (2005). The URL query separators were double-encoded as the HTML
% entity for an ampersand (number 38); they are restored to plain escaped ampersands.
@article{DBLP:journals/ieicet/ItayaZNMTK05,
  author    = {Itaya, Yohei and Zen, Heiga and Nankaku, Yoshihiko and Miyajima, Chiyomi and Tokuda, Keiichi and Kitamura, Tadashi},
  title     = {Deterministic Annealing {EM} Algorithm in Acoustic Modeling for Speaker and Speech Recognition},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {88-D},
  number    = {3},
  pages     = {425--431},
  year      = {2005},
  url       = {http://search.ieice.org/bin/summary.php?id=e88-d\_3\_425\&category=D\&year=2005\&lang=E\&abst=},
  timestamp = {Sat, 11 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ieicet/ItayaZNMTK05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2005 paper by de Lima, Zen, Nankaku, Tokuda, Kitamura and Resende (names stored in "von Last, First" form).
@inproceedings{DBLP:conf/icassp/LimaZNTKR05,
  author    = {de Lima, Amaro A. and Zen, Heiga and Nankaku, Yoshihiko and Tokuda, Keiichi and Kitamura, Tadashi and Resende, Fernando Gil},
  title     = {Sparse {KPCA} for Feature Extraction in Speech Recognition},
  booktitle = {2005 {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} '05, Philadelphia, Pennsylvania, USA, March 18-23, 2005},
  pages     = {353--356},
  publisher = {{IEEE}},
  year      = {2005},
  url       = {https://doi.org/10.1109/ICASSP.2005.1415123},
  doi       = {10.1109/ICASSP.2005.1415123},
  timestamp = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/LimaZNTKR05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IEICE Trans. Inf. Syst. article (2004) by de Lima, Zen, Nankaku, Miyajima, Tokuda and Kitamura.
@article{DBLP:journals/ieicet/LimaZNMTK04,
  author    = {de Lima, Amaro A. and Zen, Heiga and Nankaku, Yoshihiko and Miyajima, Chiyomi and Tokuda, Keiichi and Kitamura, Tadashi},
  title     = {On the Use of Kernel {PCA} for Feature Extraction in Speech Recognition},
  journal   = {{IEICE} Trans. Inf. Syst.},
  volume    = {87-D},
  number    = {12},
  pages     = {2802--2811},
  year      = {2004},
  url       = {http://search.ieice.org/bin/summary.php?id=e87-d\_12\_2802},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ieicet/LimaZNMTK04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2004 paper by Yamamoto, Nankaku, Miyajima, Tokuda and Kitamura (names stored in "Last, First" form).
@inproceedings{DBLP:conf/icassp/YamamotoNMTK04,
  author    = {Yamamoto, Hiroyoshi and Nankaku, Yoshihiko and Miyajima, Chiyomi and Tokuda, Keiichi and Kitamura, Tadashi},
  title     = {Parameter sharing and minimum classification error training of mixtures of factor analyzers for speaker identification},
  booktitle = {2004 {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2004, Montreal, Quebec, Canada, May 17-21, 2004},
  pages     = {29--32},
  publisher = {{IEEE}},
  year      = {2004},
  url       = {https://doi.org/10.1109/ICASSP.2004.1325914},
  doi       = {10.1109/ICASSP.2004.1325914},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/YamamotoNMTK04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% INTERSPEECH-ICSLP 2004 paper by Itaya, Zen, Nankaku, Miyajima, Tokuda and Kitamura (names stored in "Last, First" form).
@inproceedings{DBLP:conf/interspeech/ItayaZNMTK04,
  author    = {Itaya, Yohei and Zen, Heiga and Nankaku, Yoshihiko and Miyajima, Chiyomi and Tokuda, Keiichi and Kitamura, Tadashi},
  title     = {Deterministic annealing {EM} algorithm in parameter estimation for acoustic model},
  booktitle = {8th International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP} 2004, Jeju Island, Korea, October 4-8, 2004},
  pages     = {433--436},
  publisher = {{ISCA}},
  year      = {2004},
  url       = {https://doi.org/10.21437/Interspeech.2004-176},
  doi       = {10.21437/INTERSPEECH.2004-176},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ItayaZNMTK04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2003 paper by Suzuki, Zen, Nankaku, Miyajima, Tokuda and Kitamura (names stored in "Last, First" form).
@inproceedings{DBLP:conf/icassp/SuzukiZNMTK03,
  author    = {Suzuki, Hiroyuki and Zen, Heiga and Nankaku, Yoshihiko and Miyajima, Chiyomi and Tokuda, Keiichi and Kitamura, Tadashi},
  title     = {Speech recognition using voice-characteristic-dependent acoustic models},
  booktitle = {2003 {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} '03, Hong Kong, April 6-10, 2003},
  pages     = {740--743},
  publisher = {{IEEE}},
  year      = {2003},
  url       = {https://doi.org/10.1109/ICASSP.2003.1198887},
  doi       = {10.1109/ICASSP.2003.1198887},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/SuzukiZNMTK03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% EUROSPEECH 2003 - INTERSPEECH 2003 paper by de Lima, Zen, Nankaku, Miyajima, Tokuda and Kitamura.
@inproceedings{DBLP:conf/interspeech/LimaZNMTK03,
  author    = {de Lima, Amaro A. and Zen, Heiga and Nankaku, Yoshihiko and Miyajima, Chiyomi and Tokuda, Keiichi and Kitamura, Tadashi},
  title     = {On the use of kernel {PCA} for feature extraction in speech recognition},
  booktitle = {8th European Conference on Speech Communication and Technology, {EUROSPEECH} 2003 - {INTERSPEECH} 2003, Geneva, Switzerland, September 1-4, 2003},
  pages     = {2625--2628},
  publisher = {{ISCA}},
  year      = {2003},
  url       = {https://doi.org/10.21437/Eurospeech.2003-704},
  doi       = {10.21437/EUROSPEECH.2003-704},
  timestamp = {Thu, 22 Jun 2023 16:42:17 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/LimaZNMTK03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICIP 2000 paper. HMM is brace-protected so sentence-casing styles keep the acronym upper-case.
@inproceedings{DBLP:conf/icip/NankakuTKK00,
  author    = {Nankaku, Yoshihiko and Tokuda, Keiichi and Kitamura, Tadashi and Kobayashi, Takao},
  title     = {Normalized Training for {HMM}-Based Visual Speech Recognition},
  booktitle = {Proceedings of the 2000 International Conference on Image Processing, {ICIP} 2000, Vancouver, BC, Canada, September 10-13, 2000},
  pages     = {234--237},
  publisher = {{IEEE}},
  year      = {2000},
  url       = {https://doi.org/10.1109/ICIP.2000.899338},
  doi       = {10.1109/ICIP.2000.899338},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icip/NankakuTKK00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% EUROSPEECH 1999 paper. HMM is brace-protected so sentence-casing styles keep the acronym upper-case.
@inproceedings{DBLP:conf/interspeech/NankakuTK99,
  author    = {Nankaku, Yoshihiko and Tokuda, Keiichi and Kitamura, Tadashi},
  title     = {Intensity- and location-normalized training for {HMM}-based visual speech recognition},
  booktitle = {Sixth European Conference on Speech Communication and Technology, {EUROSPEECH} 1999, Budapest, Hungary, September 5-9, 1999},
  pages     = {1287--1290},
  publisher = {{ISCA}},
  year      = {1999},
  url       = {https://doi.org/10.21437/Eurospeech.1999-329},
  doi       = {10.21437/EUROSPEECH.1999-329},
  timestamp = {Wed, 18 Sep 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/NankakuTK99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt-in for them to become active. All settings here will be stored as cookies with your web browser. For more information see our F.A.Q.