2023
|
Rehan Ahmad; Md Asif Jalal; Muhammad Umar Farooq; Anna Ollerenshaw; Thomas Hain: Towards Domain Generalisation in ASR with Elitist Sampling and Ensemble Knowledge Distillation. In: IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2023, IEEE, 2023.
@inproceedings{ahmad2023kd,
  author     = {Rehan Ahmad and Md Asif Jalal and Muhammad Umar Farooq and Anna Ollerenshaw and Thomas Hain},
  title      = {Towards Domain Generalisation in {ASR} with Elitist Sampling and Ensemble Knowledge Distillation},
  booktitle  = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2023},
  publisher  = {IEEE},
  year       = {2023},
  date       = {2023-05-05},
  doi        = {10.1109/ICASSP49357.2023.10095746},
  url        = {https://arxiv.org/pdf/2303.00550.pdf},
  urldate    = {2023-05-05},
  eprint     = {2303.00550},
  eprinttype = {arXiv},
  keywords   = {},
  pubstate   = {published},
  tppubtype  = {inproceedings}
}
|
2022
|
Thomas Hain; Md Asif Jalal; Anna Ollerenshaw: Insights of Neural Representations in Multi-Banded and Multi-Channel Convolutional Transformers for End-to-End ASR. In: IEEE 30th European Signal Processing Conference, EUSIPCO 2022, Belgrade, Serbia, August 29 - September 2, 2022, 2022.
@inproceedings{Ollerenshaw2022,
  author    = {Thomas Hain and Md Asif Jalal and Anna Ollerenshaw},
  title     = {Insights of Neural Representations in Multi-Banded and Multi-Channel Convolutional Transformers for End-to-End {ASR}},
  booktitle = {IEEE 30th European Signal Processing Conference, EUSIPCO 2022, Belgrade, Serbia, August 29 - September 2, 2022},
  year      = {2022},
  date      = {2022-01-01},
  urldate   = {2022-01-01},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
2021
|
Jose Antonio Lopez Saenz; Md Asif Jalal; Rosanna Milner; Thomas Hain: Attention Based Model for Segmental Pronunciation Error Detection. In: IEEE Automatic Speech Recognition and Understanding Workshop, ASRU
2021, Cartagena, Colombia, December 13-17, 2021, pp. 725–732, IEEE, 2021.
@inproceedings{DBLP:conf/asru/SaenzJMH21,
  author    = {Jose Antonio Lopez Saenz and Md Asif Jalal and Rosanna Milner and Thomas Hain},
  title     = {Attention Based Model for Segmental Pronunciation Error Detection},
  booktitle = {IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2021, Cartagena, Colombia, December 13-17, 2021},
  pages     = {725--732},
  publisher = {IEEE},
  year      = {2021},
  date      = {2021-01-01},
  doi       = {10.1109/ASRU51503.2021.9687993},
  url       = {https://doi.org/10.1109/ASRU51503.2021.9687993},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Anna Ollerenshaw; Md Asif Jalal; Thomas Hain: Insights on Neural Representations for End-to-End Speech Recognition. In: Hermansky, Hynek; Cernocký, Honza; Burget, Lukás; Lamel, Lori; Scharenborg, Odette; Motlícek, Petr (Ed.): Interspeech 2021, 22nd Annual Conference of the International Speech
Communication Association, Brno, Czechia, 30 August - 3 September
2021, pp. 4079–4083, ISCA, 2021.
@inproceedings{DBLP:conf/interspeech/OllerenshawJH21,
  author    = {Anna Ollerenshaw and Md Asif Jalal and Thomas Hain},
  title     = {Insights on Neural Representations for End-to-End Speech Recognition},
  editor    = {Hynek Hermansky and Honza Cernocký and Lukás Burget and Lori Lamel and Odette Scharenborg and Petr Motlícek},
  booktitle = {Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021},
  pages     = {4079--4083},
  publisher = {ISCA},
  year      = {2021},
  date      = {2021-01-01},
  doi       = {10.21437/Interspeech.2021-1516},
  url       = {https://doi.org/10.21437/Interspeech.2021-1516},
  urldate   = {2021-01-01},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
2020
|
Md Asif Jalal; Rosanna Milner; Thomas Hain; Roger K. Moore: Removing Bias with Residual Mixture of Multi-View Attention for Speech
Emotion Recognition. In: Meng, Helen; Xu, Bo; Zheng, Thomas Fang (Ed.): Interspeech 2020, 21st Annual Conference of the International Speech
Communication Association, Virtual Event, Shanghai, China, 25-29 October
2020, pp. 4084–4088, ISCA, 2020.
@inproceedings{DBLP:conf/interspeech/JalalMHM20,
  author    = {Md Asif Jalal and Rosanna Milner and Thomas Hain and Roger K. Moore},
  title     = {Removing Bias with Residual Mixture of Multi-View Attention for Speech Emotion Recognition},
  editor    = {Helen Meng and Bo Xu and Thomas Fang Zheng},
  booktitle = {Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020},
  pages     = {4084--4088},
  publisher = {ISCA},
  year      = {2020},
  date      = {2020-01-01},
  doi       = {10.21437/Interspeech.2020-3005},
  url       = {https://doi.org/10.21437/Interspeech.2020-3005},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Md Asif Jalal; Rosanna Milner; Thomas Hain: Empirical Interpretation of Speech Emotion Perception with Attention Based Model for Speech Emotion Recognition. In: Meng, Helen; Xu, Bo; Zheng, Thomas Fang (Ed.): Interspeech 2020, 21st Annual Conference of the International Speech
Communication Association, Virtual Event, Shanghai, China, 25-29 October
2020, pp. 4113–4117, ISCA, 2020.
@inproceedings{DBLP:conf/interspeech/JalalMH20,
  author    = {Md Asif Jalal and Rosanna Milner and Thomas Hain},
  title     = {Empirical Interpretation of Speech Emotion Perception with Attention Based Model for Speech Emotion Recognition},
  editor    = {Helen Meng and Bo Xu and Thomas Fang Zheng},
  booktitle = {Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020},
  pages     = {4113--4117},
  publisher = {ISCA},
  year      = {2020},
  date      = {2020-01-01},
  doi       = {10.21437/Interspeech.2020-3007},
  url       = {https://doi.org/10.21437/Interspeech.2020-3007},
  urldate   = {2020-01-01},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
2019
|
Rosanna Milner; Md Asif Jalal; Raymond W. M. Ng; Thomas Hain: A Cross-Corpus Study on Speech Emotion Recognition. In: IEEE Automatic Speech Recognition and Understanding Workshop, ASRU
2019, Singapore, December 14-18, 2019, pp. 304–311, IEEE, 2019.
@inproceedings{DBLP:conf/asru/MilnerJNH19,
  author    = {Rosanna Milner and Md Asif Jalal and Raymond W. M. Ng and Thomas Hain},
  title     = {A Cross-Corpus Study on Speech Emotion Recognition},
  booktitle = {IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019},
  pages     = {304--311},
  publisher = {IEEE},
  year      = {2019},
  date      = {2019-01-01},
  doi       = {10.1109/ASRU46091.2019.9003838},
  url       = {https://doi.org/10.1109/ASRU46091.2019.9003838},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Md Asif Jalal; Roger K. Moore; Thomas Hain: Spatio-Temporal Context Modelling for Speech Emotion Classification. In: IEEE Automatic Speech Recognition and Understanding Workshop, ASRU
2019, Singapore, December 14-18, 2019, pp. 853–859, IEEE, 2019.
@inproceedings{DBLP:conf/asru/JalalMH19,
  author    = {Md Asif Jalal and Roger K. Moore and Thomas Hain},
  title     = {Spatio-Temporal Context Modelling for Speech Emotion Classification},
  booktitle = {IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019},
  pages     = {853--859},
  publisher = {IEEE},
  year      = {2019},
  date      = {2019-01-01},
  doi       = {10.1109/ASRU46091.2019.9004037},
  url       = {https://doi.org/10.1109/ASRU46091.2019.9004037},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Hardik B. Sailor; Salil Deena; Md Asif Jalal; Rasa Lileikyte; Thomas Hain: Unsupervised Adaptation of Acoustic Models for ASR Using Utterance-Level
Embeddings from Squeeze and Excitation Networks. In: IEEE Automatic Speech Recognition and Understanding Workshop, ASRU
2019, Singapore, December 14-18, 2019, pp. 980–987, IEEE, 2019.
@inproceedings{DBLP:conf/asru/SailorDJLH19,
  author    = {Hardik B. Sailor and Salil Deena and Md Asif Jalal and Rasa Lileikyte and Thomas Hain},
  title     = {Unsupervised Adaptation of Acoustic Models for {ASR} Using Utterance-Level Embeddings from Squeeze and Excitation Networks},
  booktitle = {IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019},
  pages     = {980--987},
  publisher = {IEEE},
  year      = {2019},
  date      = {2019-01-01},
  doi       = {10.1109/ASRU46091.2019.9003755},
  url       = {https://doi.org/10.1109/ASRU46091.2019.9003755},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Md Asif Jalal; Erfan Loweimi; Roger K. Moore; Thomas Hain: Learning Temporal Clusters Using Capsule Routing for Speech Emotion
Recognition. In: Kubin, Gernot; Kacic, Zdravko (Ed.): Interspeech 2019, 20th Annual Conference of the International Speech
Communication Association, Graz, Austria, 15-19 September 2019, pp. 1701–1705, ISCA, 2019.
@inproceedings{DBLP:conf/interspeech/JalalLMH19,
  author    = {Md Asif Jalal and Erfan Loweimi and Roger K. Moore and Thomas Hain},
  title     = {Learning Temporal Clusters Using Capsule Routing for Speech Emotion Recognition},
  editor    = {Gernot Kubin and Zdravko Kacic},
  booktitle = {Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019},
  pages     = {1701--1705},
  publisher = {ISCA},
  year      = {2019},
  date      = {2019-01-01},
  doi       = {10.21437/Interspeech.2019-3068},
  url       = {https://doi.org/10.21437/Interspeech.2019-3068},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|