2021
|
Yanpei Shi; Qiang Huang; Thomas Hain: H-VECTORS: Improving the robustness in utterance-level speaker embeddings
using a hierarchical attention model. In: Neural Networks, vol. 142, pp. 329–339, 2021.
@comment{Journal article. The leading acronym in the title is braced so that styles applying sentence case keep its capitals. The url field is the resolver form of the doi field.}
@article{DBLP:journals/nn/ShiHH21,
  author    = {Shi, Yanpei and Huang, Qiang and Hain, Thomas},
  title     = {{H-VECTORS}: Improving the robustness in utterance-level speaker embeddings using a hierarchical attention model},
  journal   = {Neural Networks},
  volume    = {142},
  pages     = {329--339},
  year      = {2021},
  doi       = {10.1016/j.neunet.2021.05.024},
  url       = {https://doi.org/10.1016/j.neunet.2021.05.024},
  pubstate  = {published},
  tppubtype = {article}
}
|
Qiang Huang; Thomas Hain: Improving Audio Anomalies Recognition Using Temporal Convolutional
Attention Networks. In: IEEE International Conference on Acoustics, Speech and Signal Processing,
ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021, pp. 6473–6477, IEEE, 2021.
@comment{Conference paper. Venue, place and event dates are carried inside booktitle, whose acronyms are braced against recasing. The url field is the resolver form of the doi field.}
@inproceedings{DBLP:conf/icassp/0008H21,
  author    = {Huang, Qiang and Hain, Thomas},
  title     = {Improving Audio Anomalies Recognition Using Temporal Convolutional Attention Networks},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages     = {6473--6477},
  publisher = {IEEE},
  year      = {2021},
  doi       = {10.1109/ICASSP39728.2021.9414611},
  url       = {https://doi.org/10.1109/ICASSP39728.2021.9414611},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
2020
|
Yanpei Shi; Qiang Huang; Thomas Hain: H-Vectors: Utterance-Level Speaker Embedding Using a Hierarchical
Attention Model. In: 2020 IEEE International Conference on Acoustics, Speech and Signal
Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020, pp. 7579–7583, IEEE, 2020.
@comment{Conference paper. The coined term opening the title and the acronyms in booktitle are braced so that recasing styles leave them intact. The url field is the resolver form of the doi field.}
@inproceedings{DBLP:conf/icassp/ShiHH20,
  author    = {Shi, Yanpei and Huang, Qiang and Hain, Thomas},
  title     = {{H-Vectors}: Utterance-Level Speaker Embedding Using a Hierarchical Attention Model},
  booktitle = {2020 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages     = {7579--7583},
  publisher = {IEEE},
  year      = {2020},
  doi       = {10.1109/ICASSP40776.2020.9054448},
  url       = {https://doi.org/10.1109/ICASSP40776.2020.9054448},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Yanpei Shi; Qiang Huang; Thomas Hain: Speaker Re-Identification with Speaker Dependent Speech Enhancement. In: Meng, Helen; Xu, Bo; Zheng, Thomas Fang (Eds.): Interspeech 2020, 21st Annual Conference of the International Speech
Communication Association, Virtual Event, Shanghai, China, 25-29 October
2020, pp. 1530–1534, ISCA, 2020.
@comment{Conference paper. Author and editor names use the Last, First form so multi-part given names parse unambiguously. The url field is the resolver form of the doi field.}
@inproceedings{DBLP:conf/interspeech/Shi0H20,
  author    = {Shi, Yanpei and Huang, Qiang and Hain, Thomas},
  title     = {Speaker Re-Identification with Speaker Dependent Speech Enhancement},
  editor    = {Meng, Helen and Xu, Bo and Zheng, Thomas Fang},
  booktitle = {Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020},
  pages     = {1530--1534},
  publisher = {ISCA},
  year      = {2020},
  doi       = {10.21437/Interspeech.2020-1772},
  url       = {https://doi.org/10.21437/Interspeech.2020-1772},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Yanpei Shi; Qiang Huang; Thomas Hain: Weakly Supervised Training of Hierarchical Attention Networks for
Speaker Identification. In: Meng, Helen; Xu, Bo; Zheng, Thomas Fang (Eds.): Interspeech 2020, 21st Annual Conference of the International Speech
Communication Association, Virtual Event, Shanghai, China, 25-29 October
2020, pp. 2992–2996, ISCA, 2020.
@comment{Conference paper. Author and editor names use the Last, First form so multi-part given names parse unambiguously. The url field is the resolver form of the doi field.}
@inproceedings{DBLP:conf/interspeech/Shi0H20a,
  author    = {Shi, Yanpei and Huang, Qiang and Hain, Thomas},
  title     = {Weakly Supervised Training of Hierarchical Attention Networks for Speaker Identification},
  editor    = {Meng, Helen and Xu, Bo and Zheng, Thomas Fang},
  booktitle = {Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020},
  pages     = {2992--2996},
  publisher = {ISCA},
  year      = {2020},
  doi       = {10.21437/Interspeech.2020-1774},
  url       = {https://doi.org/10.21437/Interspeech.2020-1774},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Qiang Huang; Thomas Hain: Exploration of Audio Quality Assessment and Anomaly Localisation Using
Attention Models. In: Meng, Helen; Xu, Bo; Zheng, Thomas Fang (Eds.): Interspeech 2020, 21st Annual Conference of the International Speech
Communication Association, Virtual Event, Shanghai, China, 25-29 October
2020, pp. 4611–4615, ISCA, 2020.
@comment{Conference paper. Author and editor names use the Last, First form so multi-part given names parse unambiguously. The url field is the resolver form of the doi field.}
@inproceedings{DBLP:conf/interspeech/0008H20,
  author    = {Huang, Qiang and Hain, Thomas},
  title     = {Exploration of Audio Quality Assessment and Anomaly Localisation Using Attention Models},
  editor    = {Meng, Helen and Xu, Bo and Zheng, Thomas Fang},
  booktitle = {Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020},
  pages     = {4611--4615},
  publisher = {ISCA},
  year      = {2020},
  doi       = {10.21437/Interspeech.2020-1885},
  url       = {https://doi.org/10.21437/Interspeech.2020-1885},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Yanpei Shi; Qiang Huang; Thomas Hain: Robust Speaker Recognition Using Speech Enhancement And Attention
Model. In: Lee, Kong-Aik; Koshinaka, Takafumi; Shinoda, Koichi (Eds.): Odyssey 2020: The Speaker and Language Recognition Workshop, 1-5 November
2020, Tokyo, Japan, pp. 451–458, ISCA, 2020.
@comment{Workshop paper. Author and editor names use the Last, First form so the hyphenated given name stays with its surname. The url field is the resolver form of the doi field.}
@inproceedings{DBLP:conf/odyssey/Shi0H20,
  author    = {Shi, Yanpei and Huang, Qiang and Hain, Thomas},
  title     = {Robust Speaker Recognition Using Speech Enhancement And Attention Model},
  editor    = {Lee, Kong-Aik and Koshinaka, Takafumi and Shinoda, Koichi},
  booktitle = {Odyssey 2020: The Speaker and Language Recognition Workshop, 1-5 November 2020, Tokyo, Japan},
  pages     = {451--458},
  publisher = {ISCA},
  year      = {2020},
  doi       = {10.21437/Odyssey.2020-65},
  url       = {https://doi.org/10.21437/Odyssey.2020-65},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
2019
|
Qiang Huang; Thomas Hain: Detecting Mismatch Between Speech and Transcription Using Cross-Modal
Attention. In: Kubin, Gernot; Kacic, Zdravko (Eds.): Interspeech 2019, 20th Annual Conference of the International Speech
Communication Association, Graz, Austria, 15-19 September 2019, pp. 584–588, ISCA, 2019.
@comment{Conference paper. Author and editor names use the Last, First form. The url field is the resolver form of the doi field.}
@inproceedings{DBLP:conf/interspeech/HuangH19,
  author    = {Huang, Qiang and Hain, Thomas},
  title     = {Detecting Mismatch Between Speech and Transcription Using Cross-Modal Attention},
  editor    = {Kubin, Gernot and Kacic, Zdravko},
  booktitle = {Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019},
  pages     = {584--588},
  publisher = {ISCA},
  year      = {2019},
  doi       = {10.21437/Interspeech.2019-2125},
  url       = {https://doi.org/10.21437/Interspeech.2019-2125},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|