2021
|
Yanpei Shi; Qiang Huang; Thomas Hain: H-VECTORS: Improving the robustness in utterance-level speaker embeddings
using a hierarchical attention model. In: Neural Networks, vol. 142, pp. 329–339, 2021. @article{DBLP:journals/nn/ShiHH21,
  author    = {Shi, Yanpei and Huang, Qiang and Hain, Thomas},
  title     = {{H-VECTORS}: Improving the robustness in utterance-level speaker embeddings using a hierarchical attention model},
  journal   = {Neural Networks},
  volume    = {142},
  pages     = {329--339},
  year      = {2021},
  doi       = {10.1016/j.neunet.2021.05.024},
  url       = {https://doi.org/10.1016/j.neunet.2021.05.024},
  pubstate  = {published},
  tppubtype = {article}
}
|
Mingjie Chen; Yanpei Shi; Thomas Hain: Towards Low-Resource StarGAN Voice Conversion Using Weight Adaptive
Instance Normalization. In: IEEE International Conference on Acoustics, Speech and Signal Processing,
ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021, pp. 5949–5953, IEEE, 2021. @inproceedings{DBLP:conf/icassp/ChenSH21,
  author    = {Chen, Mingjie and Shi, Yanpei and Hain, Thomas},
  title     = {Towards Low-Resource {StarGAN} Voice Conversion Using Weight Adaptive Instance Normalization},
  booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages     = {5949--5953},
  publisher = {IEEE},
  year      = {2021},
  doi       = {10.1109/ICASSP39728.2021.9415042},
  url       = {https://doi.org/10.1109/ICASSP39728.2021.9415042},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Yanpei Shi; Thomas Hain: Contextual Joint Factor Acoustic Embeddings. In: IEEE Spoken Language Technology Workshop, SLT 2021, Shenzhen,
China, January 19-22, 2021, pp. 750–757, IEEE, 2021. @inproceedings{DBLP:conf/slt/ShiH21,
  author    = {Shi, Yanpei and Hain, Thomas},
  title     = {Contextual Joint Factor Acoustic Embeddings},
  booktitle = {IEEE Spoken Language Technology Workshop, SLT 2021, Shenzhen, China, January 19-22, 2021},
  pages     = {750--757},
  publisher = {IEEE},
  year      = {2021},
  doi       = {10.1109/SLT48900.2021.9383592},
  url       = {https://doi.org/10.1109/SLT48900.2021.9383592},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Yanpei Shi; Thomas Hain: Supervised Speaker Embedding De-Mixing in Two-Speaker Environment. In: IEEE Spoken Language Technology Workshop, SLT 2021, Shenzhen,
China, January 19-22, 2021, pp. 758–765, IEEE, 2021. @inproceedings{DBLP:conf/slt/ShiH21a,
  author    = {Shi, Yanpei and Hain, Thomas},
  title     = {Supervised Speaker Embedding De-Mixing in Two-Speaker Environment},
  booktitle = {IEEE Spoken Language Technology Workshop, SLT 2021, Shenzhen, China, January 19-22, 2021},
  pages     = {758--765},
  publisher = {IEEE},
  year      = {2021},
  doi       = {10.1109/SLT48900.2021.9383580},
  url       = {https://doi.org/10.1109/SLT48900.2021.9383580},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
2020
|
Yanpei Shi; Qiang Huang; Thomas Hain: H-Vectors: Utterance-Level Speaker Embedding Using a Hierarchical
Attention Model. In: 2020 IEEE International Conference on Acoustics, Speech and Signal
Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020, pp. 7579–7583, IEEE, 2020. @inproceedings{DBLP:conf/icassp/ShiHH20,
  author    = {Shi, Yanpei and Huang, Qiang and Hain, Thomas},
  title     = {{H-Vectors}: Utterance-Level Speaker Embedding Using a Hierarchical Attention Model},
  booktitle = {2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020},
  pages     = {7579--7583},
  publisher = {IEEE},
  year      = {2020},
  doi       = {10.1109/ICASSP40776.2020.9054448},
  url       = {https://doi.org/10.1109/ICASSP40776.2020.9054448},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Yanpei Shi; Qiang Huang; Thomas Hain: Speaker Re-Identification with Speaker Dependent Speech Enhancement. In: Meng, Helen; Xu, Bo; Zheng, Thomas Fang (Ed.): Interspeech 2020, 21st Annual Conference of the International Speech
Communication Association, Virtual Event, Shanghai, China, 25-29 October
2020, pp. 1530–1534, ISCA, 2020. @inproceedings{DBLP:conf/interspeech/Shi0H20,
  author    = {Shi, Yanpei and Huang, Qiang and Hain, Thomas},
  title     = {Speaker Re-Identification with Speaker Dependent Speech Enhancement},
  editor    = {Meng, Helen and Xu, Bo and Zheng, Thomas Fang},
  booktitle = {Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020},
  pages     = {1530--1534},
  publisher = {ISCA},
  year      = {2020},
  doi       = {10.21437/Interspeech.2020-1772},
  url       = {https://doi.org/10.21437/Interspeech.2020-1772},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Yanpei Shi; Qiang Huang; Thomas Hain: Weakly Supervised Training of Hierarchical Attention Networks for
Speaker Identification. In: Meng, Helen; Xu, Bo; Zheng, Thomas Fang (Ed.): Interspeech 2020, 21st Annual Conference of the International Speech
Communication Association, Virtual Event, Shanghai, China, 25-29 October
2020, pp. 2992–2996, ISCA, 2020. @inproceedings{DBLP:conf/interspeech/Shi0H20a,
  author    = {Shi, Yanpei and Huang, Qiang and Hain, Thomas},
  title     = {Weakly Supervised Training of Hierarchical Attention Networks for Speaker Identification},
  editor    = {Meng, Helen and Xu, Bo and Zheng, Thomas Fang},
  booktitle = {Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020},
  pages     = {2992--2996},
  publisher = {ISCA},
  year      = {2020},
  doi       = {10.21437/Interspeech.2020-1774},
  url       = {https://doi.org/10.21437/Interspeech.2020-1774},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Yanpei Shi; Qiang Huang; Thomas Hain: Robust Speaker Recognition Using Speech Enhancement And Attention
Model. In: Lee, Kong-Aik; Koshinaka, Takafumi; Shinoda, Koichi (Ed.): Odyssey 2020: The Speaker and Language Recognition Workshop, 1-5 November
2020, Tokyo, Japan, pp. 451–458, ISCA, 2020. @inproceedings{DBLP:conf/odyssey/Shi0H20,
  author    = {Shi, Yanpei and Huang, Qiang and Hain, Thomas},
  title     = {Robust Speaker Recognition Using Speech Enhancement And Attention Model},
  editor    = {Lee, Kong-Aik and Koshinaka, Takafumi and Shinoda, Koichi},
  booktitle = {Odyssey 2020: The Speaker and Language Recognition Workshop, 1-5 November 2020, Tokyo, Japan},
  pages     = {451--458},
  publisher = {ISCA},
  year      = {2020},
  doi       = {10.21437/Odyssey.2020-65},
  url       = {https://doi.org/10.21437/Odyssey.2020-65},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|