Publications
2026
Hand gesture realisation of contrastive focus in real-time whisper-to-speech synthesis: Investigating the transfer from implicit to explicit control of intonation
Delphine Charuau, Nathalie Henrich Bernardoni, Silvain Gerber, Olivier Perrotin
Speech Communication , vol. 177 , pp. 103344
@article{Charuau2026,
  title     = {Hand gesture realisation of contrastive focus in real-time whisper-to-speech synthesis: Investigating the transfer from implicit to explicit control of intonation},
  author    = {Charuau, Delphine and Henrich Bernardoni, Nathalie and Gerber, Silvain and Perrotin, Olivier},
  year      = {2026},
  month     = feb,
  journal   = {Speech Communication},
  publisher = {Elsevier BV},
  volume    = {177},
  pages     = {103344},
  doi       = {10.1016/j.specom.2025.103344},
  issn      = {0167-6393},
  url       = {https://doi.org/10.1016/j.specom.2025.103344}
} From Hype to Insight: Rethinking Large Language Model Integration in Visual Speech Recognition
Rishabh Jain, Naomi Harte
ICASSP 2026 - 2026 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP) , pp. 18717–18721
@inproceedings{Jain2026,
  title     = {From Hype to Insight: Rethinking Large Language Model Integration in Visual Speech Recognition},
  author    = {Jain, Rishabh and Harte, Naomi},
  year      = {2026},
  month     = may,
  booktitle = {ICASSP 2026 - 2026 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  publisher = {IEEE},
  pages     = {18717--18721},
  doi       = {10.1109/icassp55912.2026.11464703},
  url       = {https://doi.org/10.1109/icassp55912.2026.11464703}
} The Role of Prosodic and Lexical Cues in Turn-Taking with Self-Supervised Speech Representations
Sam O'Connor Russell, Delphine Charuau, Naomi Harte
ICASSP 2026 - 2026 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP) , pp. 16307–16311
@inproceedings{Russell2026,
  title     = {The Role of Prosodic and Lexical Cues in Turn-Taking with Self-Supervised Speech Representations},
  author    = {Russell, Sam O'Connor and Charuau, Delphine and Harte, Naomi},
  year      = {2026},
  month     = may,
  booktitle = {ICASSP 2026 - 2026 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  publisher = {IEEE},
  pages     = {16307--16311},
  doi       = {10.1109/icassp55912.2026.11464984},
  url       = {https://doi.org/10.1109/icassp55912.2026.11464984}
} 2025
Impact of a Sharpness Based Loss Function for Removing Out-of-Focus Blur
Uditangshu Aurangabadkar, Darren Ramsook, Anil Kokaram
2025 33rd European Signal Processing Conference (EUSIPCO) , pp. 601–605
@inproceedings{Aurangabadkar2025,
  title     = {Impact of a Sharpness Based Loss Function for Removing Out-of-Focus Blur},
  author    = {Aurangabadkar, Uditangshu and Ramsook, Darren and Kokaram, Anil},
  year      = {2025},
  month     = sep,
  booktitle = {2025 33rd European Signal Processing Conference (EUSIPCO)},
  publisher = {IEEE},
  pages     = {601--605},
  doi       = {10.23919/eusipco63237.2025.11226201},
  url       = {https://doi.org/10.23919/eusipco63237.2025.11226201}
} Hot topics in speech synthesis evaluation
Gérard Bailly, Elisabeth André, Erica Cooper, Esther Klabbers, Benjamin Cowan et al.
13th edition of the Speech Synthesis Workshop , pp. 1–7
@inproceedings{Bailly2025,
  title      = {Hot topics in speech synthesis evaluation},
  author     = {Bailly, G{\'e}rard and Andr{\'e}, Elisabeth and Cooper, Erica and Klabbers, Esther and Cowan, Benjamin and Edlund, Jens and Harte, Naomi and King, Simon and Le Maguer, S{\'e}bastien and Moore, Roger K. and M{\"o}bius, Bernd and M{\"o}ller, Sebastian and Pandey, Ayushi and Perrotin, Olivier and Seebauer, Fritz and Str{\"o}mbergsson, Sofia and Traum, David R. and T{\aa}nnander, Christina and Wagner, Petra and Yamagishi, Junichi and Yasuda, Yusuke},
  year       = {2025},
  month      = aug,
  booktitle  = {13th edition of the Speech Synthesis Workshop},
  publisher  = {ISCA},
  series     = {ssw\_2025},
  pages      = {1--7},
  doi        = {10.21437/ssw.2025-1},
  url        = {https://doi.org/10.21437/ssw.2025-1},
  collection = {ssw\_2025}
} Multi Task Denoiser Training for Solving Linear Inverse Problems
Clément Bled, François Pitié
Proceedings of the 22nd ACM SIGGRAPH European Conference on Visual Media Production , pp. 1–9
@inproceedings{Bled2025,
  title      = {Multi Task Denoiser Training for Solving Linear Inverse Problems},
  author     = {Bled, Cl{\'e}ment and Piti{\'e}, Fran{\c{c}}ois},
  year       = {2025},
  month      = dec,
  booktitle  = {Proceedings of the 22nd ACM SIGGRAPH European Conference on Visual Media Production},
  publisher  = {ACM},
  series     = {CVMP '25},
  pages      = {1--9},
  doi        = {10.1145/3756863.3769703},
  url        = {https://doi.org/10.1145/3756863.3769703},
  collection = {CVMP '25}
} Multimodal Dynamics of Hand Gestures and Pauses in Multiparty Interactions
Delphine Charuau, Naomi Harte
Interspeech 2025 , pp. 3030–3034
@inproceedings{Charuau2025,
  title      = {Multimodal Dynamics of Hand Gestures and Pauses in Multiparty Interactions},
  author     = {Charuau, Delphine and Harte, Naomi},
  year       = {2025},
  month      = aug,
  booktitle  = {Interspeech 2025},
  publisher  = {ISCA},
  series     = {interspeech\_2025},
  pages      = {3030--3034},
  doi        = {10.21437/interspeech.2025-959},
  url        = {https://doi.org/10.21437/interspeech.2025-959},
  collection = {interspeech\_2025}
} Efficient motion-based metrics for video frame interpolation
Conall Daly, Darren Ramsook, Anil Kokaram
Applications of Digital Image Processing XLVIII , pp. 46
@inproceedings{Daly2025a,
  title     = {Efficient motion-based metrics for video frame interpolation},
  author    = {Daly, Conall and Ramsook, Darren and Kokaram, Anil},
  year      = {2025},
  month     = sep,
  booktitle = {Applications of Digital Image Processing XLVIII},
  publisher = {SPIE},
  pages     = {46},
  doi       = {10.1117/12.3063574},
  url       = {https://doi.org/10.1117/12.3063574},
  editor    = {Tescher, Andrew G. and Ebrahimi, Touradj}
} An Efficient Quality Metric for Video Frame Interpolation Based on Motion-Field Divergence
Conall Daly, Darren Ramsook, Anil Kokaram
2025 17th International Conference on Quality of Multimedia Experience (QoMEX) , pp. 1–7
@inproceedings{Daly2025b,
  title     = {An Efficient Quality Metric for Video Frame Interpolation Based on Motion-Field Divergence},
  author    = {Daly, Conall and Ramsook, Darren and Kokaram, Anil},
  year      = {2025},
  month     = sep,
  booktitle = {2025 17th International Conference on Quality of Multimedia Experience (QoMEX)},
  publisher = {IEEE},
  pages     = {1--7},
  doi       = {10.1109/qomex65720.2025.11219984},
  url       = {https://doi.org/10.1109/qomex65720.2025.11219984}
} Enabling the replicability of speech synthesis perceptual evaluations
Sébastien Le Maguer, Gwénolé Lecorvé, Damien Lolive, Naomi Harte, Juraj Šimko
Interspeech 2025 , pp. 2545–2549
@inproceedings{Le_Maguer2025,
  title      = {Enabling the replicability of speech synthesis perceptual evaluations},
  author     = {Le Maguer, S{\'e}bastien and Lecorv{\'e}, Gw{\'e}nol{\'e} and Lolive, Damien and Harte, Naomi and {\v{S}}imko, Juraj},
  year       = {2025},
  month      = aug,
  booktitle  = {Interspeech 2025},
  publisher  = {ISCA},
  series     = {interspeech\_2025},
  pages      = {2545--2549},
  doi        = {10.21437/interspeech.2025-401},
  url        = {https://doi.org/10.21437/interspeech.2025-401},
  collection = {interspeech\_2025}
} Uncovering the Visual Contribution in Audio-Visual Speech Recognition
Zhaofeng Lin, Naomi Harte
ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP) , pp. 1–5
@inproceedings{Lin2025,
  title     = {Uncovering the Visual Contribution in Audio-Visual Speech Recognition},
  author    = {Lin, Zhaofeng and Harte, Naomi},
  year      = {2025},
  month     = apr,
  booktitle = {ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  publisher = {IEEE},
  pages     = {1--5},
  doi       = {10.1109/icassp49660.2025.10888423},
  url       = {https://doi.org/10.1109/icassp49660.2025.10888423}
} Interpreting the Role of Visemes in Audio-Visual Speech Recognition
Aristeidis Papadopoulos, Naomi Harte
2025 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU) , pp. 1–8
@inproceedings{Papadopoulos2025,
  title     = {Interpreting the Role of Visemes in Audio-Visual Speech Recognition},
  author    = {Papadopoulos, Aristeidis and Harte, Naomi},
  year      = {2025},
  month     = dec,
  booktitle = {2025 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)},
  publisher = {IEEE},
  pages     = {1--8},
  doi       = {10.1109/asru65441.2025.11434749},
  url       = {https://doi.org/10.1109/asru65441.2025.11434749}
} Visual Cues Enhance Predictive Turn-Taking for Two-Party Human Interaction
Sam O'Connor Russell, Naomi Harte
Findings of the Association for Computational Linguistics: ACL 2025 , pp. 209–221
@inproceedings{Russell2025a,
  title     = {Visual Cues Enhance Predictive Turn-Taking for Two-Party Human Interaction},
  author    = {Russell, Sam O'Connor and Harte, Naomi},
  year      = {2025},
  booktitle = {Findings of the Association for Computational Linguistics: ACL 2025},
  pages     = {209--221},
  doi       = {10.18653/v1/2025.findings-acl.12},
  url       = {https://aclanthology.org/2025.findings-acl.12/},
  keywords  = {Turn-taking, Conversation, Multimodal interaction, Automatic speech recognition, Open-source, Speech technology}
} Visual Cues Support Robust Turn-taking Prediction in Noise
Sam O'Connor Russell, Naomi Harte
Interspeech 2025 , pp. 1073--1077
@inproceedings{Russell2025b,
  title     = {Visual Cues Support Robust Turn-taking Prediction in Noise},
  author    = {Russell, Sam O'Connor and Harte, Naomi},
  year      = {2025},
  booktitle = {Interspeech 2025},
  pages     = {1073--1077},
  url       = {https://www.isca-archive.org/interspeech_2025/oconnorrussell25_interspeech.html},
  keywords  = {Turn-taking, Conversation, Multimodal interaction, Automatic speech recognition, Open-source, Speech technology, Noise, Robust}
} An Empirical Study of Reducing AV1 Decoder Complexity and Energy Consumption via Encoder Parameter Tuning
Vibhoothi Vibhoothi, Julien Zouein, Shanker Shreejith, Jean-Baptiste Kempf, Anil Kokaram
2025 Picture Coding Symposium (PCS) , pp. 1–5
@inproceedings{Vibhoothi2025a,
  title     = {An Empirical Study of Reducing {AV1} Decoder Complexity and Energy Consumption via Encoder Parameter Tuning},
  author    = {Vibhoothi, Vibhoothi and Zouein, Julien and Shreejith, Shanker and Kempf, Jean-Baptiste and Kokaram, Anil},
  year      = {2025},
  month     = dec,
  booktitle = {2025 Picture Coding Symposium (PCS)},
  publisher = {IEEE},
  pages     = {1--5},
  doi       = {10.1109/pcs65673.2025.11417575},
  url       = {https://doi.org/10.1109/pcs65673.2025.11417575}
} LiteVPNet: A Lightweight Network for Video Encoding Control in Quality-Critical Applications
Vibhoothi Vibhoothi, François Pitié, Anil Kokaram
2025 Picture Coding Symposium (PCS) , pp. 1–5
@inproceedings{Vibhoothi2025b,
  title     = {{LiteVPNet}: A Lightweight Network for Video Encoding Control in Quality-Critical Applications},
  author    = {Vibhoothi, Vibhoothi and Piti{\'e}, Fran{\c{c}}ois and Kokaram, Anil},
  year      = {2025},
  month     = dec,
  booktitle = {2025 Picture Coding Symposium (PCS)},
  publisher = {IEEE},
  pages     = {1--5},
  doi       = {10.1109/pcs65673.2025.11417531},
  url       = {https://doi.org/10.1109/pcs65673.2025.11417531}
} AV1 Motion Vector Fidelity and Application for Efficient Optical Flow
Julien Zouein, Vibhoothi Vibhoothi, Anil Kokaram
2025 Picture Coding Symposium (PCS) , pp. 1–5
@inproceedings{Zouein2025,
  title     = {{AV1} Motion Vector Fidelity and Application for Efficient Optical Flow},
  author    = {Zouein, Julien and Vibhoothi, Vibhoothi and Kokaram, Anil},
  year      = {2025},
  month     = dec,
  booktitle = {2025 Picture Coding Symposium (PCS)},
  publisher = {IEEE},
  pages     = {1--5},
  doi       = {10.1109/pcs65673.2025.11417638},
  url       = {https://doi.org/10.1109/pcs65673.2025.11417638}
} 2024
A Dictionary Based Approach for Removing Out-of-Focus Blur
Uditangshu Aurangabadkar, Anil Kokaram
2024 IEEE International Conference on Image Processing (ICIP) , pp. 1494--1499
@inproceedings{Aurangabadkar2024a,
  author    = {Aurangabadkar, Uditangshu and Kokaram, Anil},
  title     = {A Dictionary Based Approach for Removing Out-of-Focus Blur},
  booktitle = {2024 IEEE International Conference on Image Processing (ICIP)},
  year      = {2024},
  pages     = {1494--1499},
  doi       = {10.1109/icip51287.2024.10647453},
  keywords  = {Measurement;Deep learning;Dictionaries;Computational modeling;Superresolution;Image restoration;Computational efficiency;Deblurring;Restoration;Optical Blur;Learned Filters;Sharpness}
} A Sharpness Based Loss Function for Removing Out-of-Focus Blur
Uditangshu Aurangabadkar, Darren Ramsook, Anil Kokaram
2024 IEEE 26th International Workshop on Multimedia Signal Processing (MMSP) , pp. 1--6
@inproceedings{Aurangabadkar2024b,
  author    = {Aurangabadkar, Uditangshu and Ramsook, Darren and Kokaram, Anil},
  title     = {A Sharpness Based Loss Function for Removing Out-of-Focus Blur},
  booktitle = {2024 IEEE 26th International Workshop on Multimedia Signal Processing (MMSP)},
  year      = {2024},
  pages     = {1--6},
  doi       = {10.1109/mmsp61759.2024.10743912},
  keywords  = {Measurement;Image edge detection;Conferences;Artificial neural networks;Signal processing;Image restoration;Standards;Optimization;Deblurring;Perceptual Loss;Optical blur;Dataset}
} Lightweight Video Denoising Using a Classic Bayesian Backbone
Clément Bled, François Pitié
2024 IEEE International Conference on Multimedia and Expo (ICME) , pp. 1–6
@inproceedings{Bled2024,
  title     = {Lightweight Video Denoising Using a Classic {Bayesian} Backbone},
  author    = {Bled, Cl{\'e}ment and Piti{\'e}, Fran{\c{c}}ois},
  year      = {2024},
  month     = jul,
  booktitle = {2024 IEEE International Conference on Multimedia and Expo (ICME)},
  publisher = {IEEE},
  pages     = {1--6},
  doi       = {10.1109/icme57554.2024.10688172},
  url       = {https://doi.org/10.1109/icme57554.2024.10688172},
  keywords  = {Wiener filters;Costs;Noise;Closed box;Streaming media;Transformers;Motion compensation;Bayes methods;Video Denoising;Image Sequence Denoising;Wiener Filter}
} Training speech-breathing coordination in computer-assisted reading
Delphine Charuau, Andrea Briglia, Erika Godde, Gérard Bailly
Interspeech 2024 , pp. 5128–5132
@inproceedings{Charuau2024,
  title      = {Training speech-breathing coordination in computer-assisted reading},
  author     = {Charuau, Delphine and Briglia, Andrea and Godde, Erika and Bailly, G{\'e}rard},
  year       = {2024},
  month      = sep,
  booktitle  = {Interspeech 2024},
  publisher  = {ISCA},
  series     = {interspeech\_2024},
  pages      = {5128--5132},
  doi        = {10.21437/interspeech.2024-992},
  url        = {https://doi.org/10.21437/interspeech.2024-992},
  collection = {interspeech\_2024}
} Joint Speech-Text Embeddings for Multitask Speech Processing
Michael Gian Gonzales, Peter Corcoran, Naomi Harte, Michael Schukat
IEEE Access , vol. 12 , pp. 145955–145967
@article{Gonzales2024,
  title     = {Joint Speech-Text Embeddings for Multitask Speech Processing},
  author    = {Gonzales, Michael Gian and Corcoran, Peter and Harte, Naomi and Schukat, Michael},
  year      = {2024},
  journal   = {IEEE Access},
  publisher = {Institute of Electrical and Electronics Engineers (IEEE)},
  volume    = {12},
  pages     = {145955--145967},
  doi       = {10.1109/access.2024.3473743},
  issn      = {2169-3536},
  url       = {https://doi.org/10.1109/access.2024.3473743}
} Demystifying the use of Compression in Virtual Production
Anil Kokaram, Vibhoothi Vibhoothi, Julien Zouein, François Pitié, Christopher Nash, James Bentley et al.
SMPTE Media Technology Summit 2024
@inproceedings{Kokaram2024,
  title     = {Demystifying the use of Compression in Virtual Production},
  author    = {Kokaram, Anil and Vibhoothi, Vibhoothi and Zouein, Julien and Piti{\'e}, Fran{\c{c}}ois and Nash, Christopher and Bentley, James and Coulam-Jones, Philip},
  year      = {2024},
  month     = oct,
  booktitle = {SMPTE Media Technology Summit 2024},
  publisher = {SMPTE}
} The limits of the Mean Opinion Score for speech synthesis evaluation
Sébastien Le Maguer, Simon King, Naomi Harte
Computer Speech & Language , vol. 84 , pp. 101577
@article{Maguer2024,
  title    = {The limits of the Mean Opinion Score for speech synthesis evaluation},
  author   = {Le Maguer, S{\'e}bastien and King, Simon and Harte, Naomi},
  year     = {2024},
  journal  = {Computer Speech \& Language},
  volume   = {84},
  pages    = {101577},
  doi      = {10.1016/j.csl.2023.101577},
  issn     = {0885-2308},
  url      = {https://www.sciencedirect.com/science/article/pii/S0885230823000967},
  keywords = {Speech synthesis evaluation, Absolute Category Rating, Mean Opinion Score, Blizzard Challenge}
} A Neural Enhancement Post-Processor with a Dynamic AV1 Encoder Configuration Strategy for CLIC 2024
Darren Ramsook, Anil Kokaram
2024 Data Compression Conference (DCC) , pp. 372--381
@inproceedings{Ramsook2024a,
  title     = {A Neural Enhancement Post-Processor with a Dynamic {AV1} Encoder Configuration Strategy for {CLIC} 2024},
  author    = {Ramsook, Darren and Kokaram, Anil},
  year      = {2024},
  booktitle = {2024 Data Compression Conference (DCC)},
  pages     = {372--381},
  doi       = {10.1109/dcc58796.2024.00045},
  keywords  = {Training;Bit rate;Pipelines;Data compression;Video compression;Streaming media;Perceptual Enhancement;Perceptual Video Compression Pipeline;Neural Video Enhancement}
} Comparative Analysis of Subjective Evaluations for Traditional and Neural-Based Video Enhancement Techniques
Darren Ramsook, Vibhoothi, Anil Kokaram, Angeliki Katsenou, David Bull
2024 16th International Conference on Quality of Multimedia Experience (QoMEX) , pp. 242--245
@inproceedings{Ramsook2024b,
  author    = {Ramsook, Darren and Vibhoothi and Kokaram, Anil and Katsenou, Angeliki and Bull, David},
  title     = {Comparative Analysis of Subjective Evaluations for Traditional and Neural-Based Video Enhancement Techniques},
  booktitle = {2024 16th International Conference on Quality of Multimedia Experience (QoMEX)},
  year      = {2024},
  pages     = {242--245},
  doi       = {10.1109/QoMEX61742.2024.10598241},
  keywords  = {Measurement;Streaming media;Observers;Quality assessment;Video recording;Subjective analysis;video restoration;perceptual criteria}
} What automatic speech recognition can and cannot do for conversational speech transcription
Sam O'Connor Russell, Iona Gessinger, Anna Krason, Gabriella Vigliocco, Naomi Harte
Research Methods in Applied Linguistics , vol. 3 , no. 3 , pp. 100163
@article{Russell2024,
  title    = {What automatic speech recognition can and cannot do for conversational speech transcription},
  author   = {Russell, Sam O'Connor and Gessinger, Iona and Krason, Anna and Vigliocco, Gabriella and Harte, Naomi},
  year     = {2024},
  journal  = {Research Methods in Applied Linguistics},
  volume   = {3},
  number   = {3},
  pages    = {100163},
  doi      = {10.1016/j.rmal.2024.100163},
  issn     = {2772-7661},
  url      = {https://www.sciencedirect.com/science/article/pii/S2772766124000697},
  keywords = {Transcription, Automatic speech recognition, Open-source, Speech technology}
} Predicting total time to compress a video corpus using online inference systems
Xin Shu, Vibhoothi Vibhoothi, Anil Kokaram
2024 IEEE International Conference on Visual Communications and Image Processing (VCIP) , pp. 1–5
@inproceedings{Shu2024,
  title     = {Predicting total time to compress a video corpus using online inference systems},
  author    = {Shu, Xin and Vibhoothi, Vibhoothi and Kokaram, Anil},
  year      = {2024},
  month     = dec,
  booktitle = {2024 IEEE International Conference on Visual Communications and Image Processing (VCIP)},
  publisher = {IEEE},
  pages     = {1--5},
  doi       = {10.1109/vcip63160.2024.10849826},
  url       = {https://doi.org/10.1109/vcip63160.2024.10849826}
} Using Single-Pass Look-Ahead in Modern Codecs for Optimized Transcoding Deployment
Vibhoothi Vibhoothi, Julien Zouein, François Pitié, Anil Kokaram
SMPTE Motion Imaging Journal , vol. 133 , no. 6
@article{Vibhoothi2024a,
  title     = {Using Single-Pass Look-Ahead in Modern Codecs for Optimized Transcoding Deployment},
  author    = {Vibhoothi, Vibhoothi and Zouein, Julien and Piti{\'e}, Fran{\c{c}}ois and Kokaram, Anil},
  year      = {2024},
  month     = oct,
  journal   = {SMPTE Motion Imaging Journal},
  publisher = {Society of Motion Picture and Television Engineers (SMPTE)},
  volume    = {133},
  number    = {6},
  doi       = {10.5594/jmi.2024/wssg3140},
  issn      = {2160-2492},
  url       = {https://doi.org/10.5594/jmi.2024/wssg3140}
} Unravelling the Power of Single-Pass Look-Ahead in Modern Codecs for Optimized Transcoding Deployment
Vibhoothi Vibhoothi, Julien Zouein, François Pitié, Anil Kokaram
NAB Broadcast Engineering and Information Technology (BEIT) Conference
@inproceedings{Vibhoothi2024b,
  title     = {Unravelling the Power of Single-Pass Look-Ahead in Modern Codecs for Optimized Transcoding Deployment},
  author    = {Vibhoothi, Vibhoothi and Zouein, Julien and Piti{\'e}, Fran{\c{c}}ois and Kokaram, Anil},
  year      = {2024},
  booktitle = {NAB Broadcast Engineering and Information Technology (BEIT) Conference},
  publisher = {National Association of Broadcasters}
} 2023
Learnable Frontends That Do Not Learn: Quantifying Sensitivity To Filterbank Initialisation
Mark Anderson, Tomi Kinnunen, Naomi Harte
ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP) , pp. 1--5
@inproceedings{Anderson2023,
  author    = {Anderson, Mark and Kinnunen, Tomi and Harte, Naomi},
  title     = {Learnable Frontends That Do Not Learn: Quantifying Sensitivity To Filterbank Initialisation},
  booktitle = {ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  year      = {2023},
  pages     = {1--5},
  doi       = {10.1109/icassp49357.2023.10095474},
  keywords  = {Training;Voice activity detection;Sensitivity;Neural networks;Signal processing;Acoustics;Gabor filters;Learnable Filterbanks;LEAF;Learnable Frontend;Sensitivity;Initialisation}
} Pushing the Limits of the Wiener Filter in Image Denoising
Clément Bled, François Pitié
2023 IEEE International Conference on Image Processing (ICIP) , pp. 2590--2594
@inproceedings{Bled2023,
  title     = {Pushing the Limits of the {Wiener} Filter in Image Denoising},
  author    = {Bled, Cl{\'e}ment and Piti{\'e}, Fran{\c{c}}ois},
  year      = {2023},
  booktitle = {2023 IEEE International Conference on Image Processing (ICIP)},
  pages     = {2590--2594},
  doi       = {10.1109/icip49359.2023.10222826},
  keywords  = {Wiener filters;Filtering;Neural networks;Benchmark testing;Convolutional neural networks;Optimization;Image denoising;Image Denoising;Wiener Filter}
} Fine Grained Spoken Document Summarization Through Text Segmentation
Samantha Kotey, Rozenn Dahyot, Naomi Harte
2022 IEEE Spoken Language Technology Workshop (SLT) , pp. 647--654
@inproceedings{Kotey2023,
  author    = {Kotey, Samantha and Dahyot, Rozenn and Harte, Naomi},
  title     = {Fine Grained Spoken Document Summarization Through Text Segmentation},
  booktitle = {2022 IEEE Spoken Language Technology Workshop (SLT)},
  year      = {2023},
  pages     = {647--654},
  doi       = {10.1109/slt54892.2023.10022829},
  keywords  = {Filtering;Conferences;Training data;Oral communication;Linguistics;Transformers;Readability metrics;spoken document summarization;text segmentation;long sequence transformers;readability formulas;podcast summarization}
} Learnt Deep Hyperparameter Selection in Adversarial Training for Compressed Video Enhancement with a Perceptual Critic
Darren Ramsook, Anil Kokaram
2023 IEEE International Conference on Image Processing (ICIP) , pp. 2420--2424
@inproceedings{Ramsook2023,
  author    = {Ramsook, Darren and Kokaram, Anil},
  title     = {Learnt Deep Hyperparameter Selection in Adversarial Training for Compressed Video Enhancement with a Perceptual Critic},
  booktitle = {2023 IEEE International Conference on Image Processing (ICIP)},
  year      = {2023},
  pages     = {2420--2424},
  doi       = {10.1109/icip49359.2023.10222397},
  keywords  = {Measurement;Training;Image coding;Neuroscience;Feature extraction;Data mining;Compressed Video Enhancement;Perceptual Optimization;Perceptual Deep Features}
} The disparity between optimal and practical Lagrangian multiplier estimation in video encoders
Daniel Joseph Ringis, Vibhoothi Vibhoothi, François Pitié, Anil Kokaram
Frontiers in Signal Processing , vol. 3
@article{Ringis2023,
  title   = {The disparity between optimal and practical {Lagrangian} multiplier estimation in video encoders},
  author  = {Ringis, Daniel Joseph and Vibhoothi, Vibhoothi and Piti{\'e}, Fran{\c{c}}ois and Kokaram, Anil},
  year    = {2023},
  journal = {Frontiers in Signal Processing},
  volume  = {3},
  doi     = {10.3389/frsip.2023.1205104},
  issn    = {2673-8198},
  url     = {https://www.frontiersin.org/journals/signal-processing/articles/10.3389/frsip.2023.1205104}
} Comparison of HDR quality metrics in Per-Clip Lagrangian multiplier optimisation with AV1
Vibhoothi Vibhoothi, François Pitié, Angeliki Katsenou, Yeping Su, Balu Adsumilli, Anil Kokaram
2023 IEEE International Conference on Multimedia and Expo (ICME) , pp. 1655--1660
@inproceedings{Vibhoothi2023a,
  title     = {Comparison of {HDR} quality metrics in Per-Clip {Lagrangian} multiplier optimisation with {AV1}},
  author    = {Vibhoothi, Vibhoothi and Piti{\'e}, Fran{\c{c}}ois and Katsenou, Angeliki and Su, Yeping and Adsumilli, Balu and Kokaram, Anil},
  year      = {2023},
  booktitle = {2023 IEEE International Conference on Multimedia and Expo (ICME)},
  pages     = {1655--1660},
  doi       = {10.1109/icme55011.2023.00285},
  keywords  = {Measurement;Codecs;Rate-distortion;ITU;High dynamic range;Complexity theory;Optimization;HDR;Quality Metrics;AV1;Rate-Distortion Optimisation}
} Filling the gaps in video transcoder deployment in the cloud
Vibhoothi, Daniel Joseph Ringis, Xin Shu, François Pitié, Zsolt Lorincz et al.
NAB Broadcast Engineering and Information Technology (BEIT) Conference
@inproceedings{Vibhoothi2023b,
  title     = {Filling the gaps in video transcoder deployment in the cloud},
  author    = {Vibhoothi and Ringis, Daniel Joseph and Shu, Xin and Piti{\'e}, Fran{\c{c}}ois and Lorincz, Zsolt and Brodeur, Philippe and Kokaram, Anil},
  year      = {2023},
  booktitle = {NAB Broadcast Engineering and Information Technology (BEIT) Conference},
  publisher = {National Association of Broadcasters},
  url       = {https://arxiv.org/abs/2304.08634}
} Recommendations for Verifying HDR Subjective Testing Workflows
Vibhoothi Vibhoothi, Angeliki Katsenou, John Squires, François Pitié, Anil Kokaram
2023 15th International Conference on Quality of Multimedia Experience (QoMEX) , pp. 197--200
@inproceedings{Vibhoothi2023c,
  title     = {Recommendations for Verifying {HDR} Subjective Testing Workflows},
  author    = {Vibhoothi, Vibhoothi and Katsenou, Angeliki and Squires, John and Piti{\'e}, Fran{\c{c}}ois and Kokaram, Anil},
  year      = {2023},
  booktitle = {2023 15th International Conference on Quality of Multimedia Experience (QoMEX)},
  pages     = {197--200},
  doi       = {10.1109/QoMEX58391.2023.10178488},
  keywords  = {TV;Brightness;Pipelines;Color;Production;Organic light emitting diodes;Encoding;HDR;testing workflow;testing environment;playback;video coding}
} Subjective Assessment of the Impact of a Content Adaptive Optimiser for Compressing 4K HDR Content With AV1
Vibhoothi Vibhoothi, Angeliki Katsenou, François Pitié, Katarina Domijan, Anil Kokaram
2023 IEEE International Conference on Image Processing (ICIP) , pp. 2610--2614
@inproceedings{Vibhoothi2023d,
  title     = {Subjective Assessment of the Impact of a Content Adaptive Optimiser for Compressing {4K} {HDR} Content With {AV1}},
  author    = {Vibhoothi, Vibhoothi and Katsenou, Angeliki and Piti{\'e}, Fran{\c{c}}ois and Domijan, Katarina and Kokaram, Anil},
  year      = {2023},
  booktitle = {2023 IEEE International Conference on Image Processing (ICIP)},
  pages     = {2610--2614},
  doi       = {10.1109/icip49359.2023.10222332},
  keywords  = {Measurement;Protocols;Image coding;Rate-distortion;Streaming media;Quality assessment;Quality of experience;HDR;AV1;Rate-Distortion optimisation;Subjective study;Quality metrics}
} 2022
An empirical approach for estimating the effect of a transcoding aware preprocessor
Varoun Hanooman, Yeping Su, Neil Birkbeck, Balu Adsumilli, Anil Kokaram
Applications of Digital Image Processing XLV , vol. 12226 , pp. 1222613
@inproceedings{Hanooman2022,
  title        = {An empirical approach for estimating the effect of a transcoding aware preprocessor},
  author       = {Hanooman, Varoun and Su, Yeping and Birkbeck, Neil and Adsumilli, Balu and Kokaram, Anil},
  year         = {2022},
  booktitle    = {Applications of Digital Image Processing XLV},
  publisher    = {SPIE},
  volume       = {12226},
  pages        = {1222613},
  doi          = {10.1117/12.2633578},
  url          = {https://doi.org/10.1117/12.2633578},
  editor       = {Tescher, Andrew G. and Ebrahimi, Touradj},
  organization = {International Society for Optics and Photonics},
  keywords     = {video compression, preprocessing, Denoising, transcoding, AV1, VP9}
} Learnable Acoustic Frontends in Bird Activity Detection
Mark Anderson, Naomi Harte
2022 International Workshop on Acoustic Signal Enhancement (IWAENC) , pp. 1--5
@inproceedings{Anderson2022,
  author    = {Anderson, Mark and Harte, Naomi},
  title     = {Learnable Acoustic Frontends in Bird Activity Detection},
  booktitle = {2022 International Workshop on Acoustic Signal Enhancement (IWAENC)},
  year      = {2022},
  pages     = {1--5},
  doi       = {10.1109/iwaenc53105.2022.9914694}
} Assessing Advances in Real Noise Image Denoisers
Clément Bled, François Pitié
Proceedings of the 19th ACM SIGGRAPH European Conference on Visual Media Production
@inproceedings{Bled2022,
  title     = {Assessing Advances in Real Noise Image Denoisers},
  author    = {Bled, Cl{\'e}ment and Piti{\'e}, Fran{\c{c}}ois},
  year      = {2022},
  booktitle = {Proceedings of the 19th ACM SIGGRAPH European Conference on Visual Media Production},
  location  = {London, United Kingdom},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  series    = {CVMP '22},
  doi       = {10.1145/3565516.3565524},
  isbn      = {9781450399395},
  url       = {https://doi.org/10.1145/3565516.3565524},
  articleno = {8},
  numpages  = {9},
  keywords  = {Image denoising, neural networks, real noise}
} An Empirical Approach for Optimising the Impact of a Preprocessor in a Transcoding Pipeline
Varoun Hanooman, Anil C. Kokaram, Yeping Su, Neil Birkbeck, Balu Adsumilli
2022 IEEE International Conference on Image Processing (ICIP) , pp. 2201--2205
@inproceedings{Hanooman2022b,
  title     = {An Empirical Approach for Optimising the Impact of a Preprocessor in a Transcoding Pipeline},
  author    = {Hanooman, Varoun and Kokaram, Anil C. and Su, Yeping and Birkbeck, Neil and Adsumilli, Balu},
  year      = {2022},
  booktitle = {2022 IEEE International Conference on Image Processing (ICIP)},
  pages     = {2201--2205},
  doi       = {10.1109/icip46576.2022.9897611},
  keywords  = {Measurement;Pandemics;Image processing;Bit rate;Pipelines;User-generated content;Data preprocessing;preprocessor;denoising;codec;transcoding;compression}
} Robo-Identity: Exploring Artificial Identity and Emotion via Speech Interactions
Guy Laban, Sebastien Le Maguer, Minha Lee, Dimosthenis Kontogiorgos, Samantha Reig et al.
Proceedings of the ACM/IEEE International Conference on Human-Robot Interaction , pp. 1265–1268
@inproceedings{Laban2022,
  title     = {Robo-Identity: Exploring Artificial Identity and Emotion via Speech Interactions},
  author    = {Laban, Guy and Le Maguer, S{\'e}bastien and Lee, Minha and Kontogiorgos, Dimosthenis and Reig, Samantha and Torre, Ilaria and Tejwani, Ravi and Dennis, Matthew J. and Pereira, Andre},
  year      = {2022},
  booktitle = {Proceedings of the ACM/IEEE International Conference on Human-Robot Interaction},
  location  = {Sapporo, Hokkaido, Japan},
  publisher = {IEEE Press},
  series    = {HRI '22},
  pages     = {1265--1268},
  numpages  = {4},
  keywords  = {affective science, affective computing, human-robot interaction, voice, emotion, speech, artificial identity}
} Back to the Future: Extending the Blizzard Challenge 2013
Sébastien Le Maguer, Simon King, Naomi Harte
Proceedings of Interspeech , pp. 2378--2382
@inproceedings{Maguer2022,
  title     = {Back to the Future: Extending the {Blizzard Challenge} 2013},
  author    = {Le Maguer, S{\'e}bastien and King, Simon and Harte, Naomi},
  year      = {2022},
  booktitle = {Proceedings of Interspeech},
  pages     = {2378--2382},
  doi       = {10.21437/Interspeech.2022-10633}
} Production characteristics of obstruents in WaveNet and older TTS systems
Ayushi Pandey, Sébastien Le Maguer, Julie Carson-Berndsen, Naomi Harte
Proceedings of Interspeech , pp. 2373--2377
@inproceedings{Pandey2022,
  author    = {Ayushi Pandey and S\'{e}bastien {Le Maguer} and Julie Carson-Berndsen and Naomi Harte},
  title     = {Production characteristics of obstruents in WaveNet and older TTS systems},
  booktitle = {Proceedings of Interspeech},
  year      = {2022},
  pages     = {2373--2377},
  doi       = {10.21437/Interspeech.2022-10606}
} A Deep Learning post-processor with a perceptual loss function for video compression artifact removal
D. Ramsook, A. Kokaram, N. Birkbeck, Y. Su, B. Adsumilli
2022 Picture Coding Symposium (PCS) , pp. 85--89
@inproceedings{Ramsook2022a,
  author    = {Ramsook, D. and Kokaram, A. and Birkbeck, N. and Su, Y. and Adsumilli, B.},
  title     = {A Deep Learning post-processor with a perceptual loss function for video compression artifact removal},
  booktitle = {2022 Picture Coding Symposium (PCS)},
  year      = {2022},
  pages     = {85--89},
  doi       = {10.1109/pcs56426.2022.10018047},
  keywords  = {Deep learning;Training;Neural networks;Bit rate;Video compression;Streaming media;Encoding;Perceptually Motivated Restoration;Artifact Removal;Video Restoration}
} Perceptually motivated deep neural network for video compression artifact removal
Darren Ramsook, Anil Kokaram, Neil Birkbeck, Yeping Su, Balu Adsumilli
Applications of Digital Image Processing XLV , vol. 12226 , pp. 122260h
@inproceedings{Ramsook2022b,
  author       = {Darren Ramsook and Anil Kokaram and Neil Birkbeck and Yeping Su and Balu Adsumilli},
  title        = {Perceptually motivated deep neural network for video compression artifact removal},
  booktitle    = {Applications of Digital Image Processing XLV},
  editor       = {Andrew G. Tescher and Touradj Ebrahimi},
  year         = {2022},
  volume       = {12226},
  pages        = {122260H},
  publisher    = {{SPIE}},
  organization = {International Society for Optics and Photonics},
  doi          = {10.1117/12.2633552},
  url          = {https://doi.org/10.1117/12.2633552},
  keywords     = {Video Artefact Removal, Perceptually Motivated Video Artefact Removal, Perceptual Loss Function}
} Automating sports broadcasting using ultra-high definition cameras, neural networks, and classical denoising
Sophia Rosney, Ciarán Donegan, Meegan Gower, Wissam Jassim, Hugh Denman, Donal Scannell et al.
Applications of Digital Image Processing XLV , vol. 12226 , pp. 122260y
@inproceedings{Rosney2022,
  author       = {Sophia Rosney and Ciar{\'a}n Donegan and Meegan Gower and Wissam Jassim
                  and Hugh Denman and Donal Scannell and Anil Kokaram},
  title        = {Automating sports broadcasting using ultra-high definition cameras, neural networks, and classical denoising},
  booktitle    = {Applications of Digital Image Processing XLV},
  editor       = {Andrew G. Tescher and Touradj Ebrahimi},
  year         = {2022},
  volume       = {12226},
  pages        = {122260Y},
  publisher    = {{SPIE}},
  organization = {International Society for Optics and Photonics},
  doi          = {10.1117/12.2633075},
  url          = {https://doi.org/10.1117/12.2633075},
  keywords     = {automated broadcasting, YOLO object detection, virtual production, denoising, deblurring, ultra high definition, real-time, sports video}
} Direct optimisation of λ for HDR content adaptive transcoding in AV1
Vibhoothi, François Pitié, Angeliki Katsenou, Daniel Joseph Ringis, Yeping Su et al.
Applications of Digital Image Processing XLV , vol. 12226 , pp. 36--45
@inproceedings{Vibhoothi2022,
  author       = {{Vibhoothi} and Piti\'{e}, Fran\c{c}ois and Katsenou, Angeliki and Ringis, Daniel Joseph
                  and Su, Yeping and Birkbeck, Neil and Lin, Jessie and Adsumilli, Balu
                  and Kokaram, Anil and others},
  title        = {Direct optimisation of {$\lambda$} for {HDR} content adaptive transcoding in {AV1}},
  booktitle    = {Applications of Digital Image Processing XLV},
  year         = {2022},
  volume       = {12226},
  pages        = {36--45},
  organization = {{SPIE}}
} 2021
Bioacoustic Event Detection with prototypical networks and data augmentation
Mark Anderson, Naomi Harte
arXiv
@misc{Anderson2021a,
  author        = {Anderson, Mark and Harte, Naomi},
  title         = {Bioacoustic Event Detection with prototypical networks and data augmentation},
  year          = {2021},
  publisher     = {arXiv},
  eprint        = {2112.09006},
  archiveprefix = {arXiv},
  primaryclass  = {eess.AS},
  doi           = {10.48550/arxiv.2112.09006},
  url           = {https://arxiv.org/abs/2112.09006},
  copyright     = {Creative Commons Attribution Share Alike 4.0 International},
  keywords      = {Audio and Speech Processing (eess.AS), FOS: Electrical engineering, electronic engineering, information engineering}
} Low Resource Species Agnostic Bird Activity Detection
Mark Anderson, John Kennedy, Naomi Harte
2021 IEEE Workshop on Signal Processing Systems (SiPS) , pp. 34--39
@inproceedings{Anderson2021b,
  author    = {Anderson, Mark and Kennedy, John and Harte, Naomi},
  title     = {Low Resource Species Agnostic Bird Activity Detection},
  booktitle = {2021 IEEE Workshop on Signal Processing Systems (SiPS)},
  year      = {2021},
  pages     = {34--39},
  doi       = {10.1109/SiPS52927.2021.00015}
} An articulatory study of differences and similarities between stuttered disfluencies and non-pathological disfluencies
Ivana Didirková, Sébastien Le Maguer, Fabrice Hirsch
Clinical Linguistics & Phonetics , vol. 35 , no. 3 , pp. 201--221
@article{Didirkov_a2021,
  author    = {Ivana Didirkov\'{a} and S\'{e}bastien {Le Maguer} and Fabrice Hirsch},
  title     = {An articulatory study of differences and similarities between stuttered disfluencies and non-pathological disfluencies},
  journal   = {Clinical Linguistics {\&} Phonetics},
  year      = {2021},
  month     = {mar},
  volume    = {35},
  number    = {3},
  pages     = {201--221},
  publisher = {Taylor {\&} Francis},
  doi       = {10.1080/02699206.2020.1752803},
  issn      = {0269-9206}
} Phonetic accommodation in interaction with a virtual language learning tutor: A Wizard-of-Oz study
Iona Gessinger, Bernd Möbius, Sébastien Le Maguer, Eran Raveh, Ingmar Steiner
Journal of Phonetics , vol. 86 , pp. 101029
@article{Gessinger2021,
  author    = {Iona Gessinger and Bernd M{\"o}bius and S\'{e}bastien {Le Maguer} and Eran Raveh and Ingmar Steiner},
  title     = {Phonetic accommodation in interaction with a virtual language learning tutor: A Wizard-of-Oz study},
  journal   = {Journal of Phonetics},
  year      = {2021},
  month     = {may},
  volume    = {86},
  pages     = {101029},
  publisher = {Academic Press},
  doi       = {10.1016/j.wocn.2021.101029},
  issn      = {0095-4470},
  pdf       = {https://www.sciencedirect.com/science/article/pii/S0095447021000012/pdfft?isDTMRedir=true&download=true}
} Synthesizing a Human-like Voice is the Easy Way
Sébastien Le Maguer, Benjamin R. Cowan
CUI 2021 - 3rd Conference on Conversational User Interfaces
@inproceedings{Le_Maguer2021,
  author    = {{Le Maguer}, S\'{e}bastien and Cowan, Benjamin R.},
  title     = {Synthesizing a Human-like Voice is the Easy Way},
  booktitle = {CUI 2021 - 3rd Conference on Conversational User Interfaces},
  series    = {{CUI} '21},
  year      = {2021},
  articleno = {19},
  numpages  = {3},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  location  = {Bilbao (online), Spain},
  doi       = {10.1145/3469595.3469614},
  isbn      = {9781450389983},
  pdf       = {https://dl.acm.org/doi/pdf/10.1145/3469595.3469614},
  keywords  = {human-like/non-human-like sounding voice, Speech synthesis}
} Will synthetic speech provide a suitable voice for robots?
Sébastien Le Maguer
Robo-Identity: Artificial identity and multi-embodiment
@inproceedings{Maguer2021,
  author    = {S\'{e}bastien {Le Maguer}},
  title     = {Will synthetic speech provide a suitable voice for robots?},
  booktitle = {Robo-Identity: Artificial identity and multi-embodiment},
  year      = {2021},
  pdf       = {https://drive.google.com/file/d/1Lnmoa1M87JVgyRgikq9e60IK3kpr6zbw/view?usp=sharing}
} Mind your p's and k's -- Comparing obstruents across TTS voices of the Blizzard Challenge 2013
Ayushi Pandey, Sébastien Le Maguer, Julie Berndsen, Naomi Harte
Speech Synthesis Workshop (SSW) , pp. 166--171
@inproceedings{Pandey2021,
  author    = {Ayushi Pandey and S\'{e}bastien {Le Maguer} and Julie Berndsen and Naomi Harte},
  title     = {Mind your p's and k's -- Comparing obstruents across TTS voices of the Blizzard Challenge 2013},
  booktitle = {Speech Synthesis Workshop (SSW)},
  year      = {2021},
  pages     = {166--171},
  doi       = {10.21437/ssw.2021-29},
  pdf       = {https://www.isca-speech.org/archive/pdfs/ssw_2021/pandey21_ssw.pdf}
} CNN-Based Video Codec Classifier For Multimedia Forensics
Rodrigo Pessoa, Anil Kokaram, Francois Pitie, Mark Sugrue
2021 IEEE International Conference on Image Processing (ICIP) , pp. 3033--3037
@inproceedings{Pessoa2021,
  author    = {Pessoa, Rodrigo and Kokaram, Anil and Piti\'{e}, Fran\c{c}ois and Sugrue, Mark},
  title     = {CNN-Based Video Codec Classifier For Multimedia Forensics},
  booktitle = {2021 IEEE International Conference on Image Processing (ICIP)},
  year      = {2021},
  pages     = {3033--3037},
  doi       = {10.1109/icip42928.2021.9506020},
  keywords  = {Forensics;Image processing;Conferences;User-generated content;Streaming media;Fingerprint recognition;Rendering (computer graphics);video;forensics;CNN;codec;decoding}
} A differentiable estimator of VMAF for Video
Darren Ramsook, Anil Kokaram, Noel O'Connor, Neil Birkbeck, Yeping Su, Balu Adsumilli
2021 Picture Coding Symposium (PCS) , pp. 1--5
@inproceedings{Ramsook2021a,
  author    = {Ramsook, Darren and Kokaram, Anil and O'Connor, Noel and Birkbeck, Neil
               and Su, Yeping and Adsumilli, Balu},
  title     = {A differentiable estimator of VMAF for Video},
  booktitle = {2021 Picture Coding Symposium (PCS)},
  year      = {2021},
  pages     = {1--5},
  doi       = {10.1109/pcs50896.2021.9477480},
  keywords  = {Measurement;Training;Visualization;Image coding;Training data;Feature extraction;Encoding;Perceptual Visual Quality;Video Quality;Deep Neural Network}
} A differentiable VMAF proxy as a loss function for video noise reduction
Darren Ramsook, Anil Kokaram, Noel O'Connor, Neil Birkbeck, Yeping Su, Balu Adsumilli
Applications of Digital Image Processing XLIV , vol. 11842 , pp. 118420x
@inproceedings{Ramsook2021b,
  author       = {Darren Ramsook and Anil Kokaram and Noel O'Connor and Neil Birkbeck
                  and Yeping Su and Balu Adsumilli},
  title        = {A differentiable VMAF proxy as a loss function for video noise reduction},
  booktitle    = {Applications of Digital Image Processing XLIV},
  editor       = {Andrew G. Tescher and Touradj Ebrahimi},
  year         = {2021},
  volume       = {11842},
  pages        = {118420X},
  publisher    = {{SPIE}},
  organization = {International Society for Optics and Photonics},
  doi          = {10.1117/12.2594164},
  url          = {https://doi.org/10.1117/12.2594164},
  keywords     = {HVS loss function, Perceptually Motivated Video Restoration, Video Restoration}
} Near optimal per-clip lagrangian multiplier prediction in hevc
Daniel J Ringis, François Pitié, Anil Kokaram
2021 Picture Coding Symposium (PCS) , pp. 1--5
@inproceedings{Ringis2021a,
  author       = {Ringis, Daniel J and Piti\'{e}, Fran\c{c}ois and Kokaram, Anil},
  title        = {Near optimal per-clip {Lagrangian} multiplier prediction in {HEVC}},
  booktitle    = {2021 Picture Coding Symposium (PCS)},
  year         = {2021},
  pages        = {1--5},
  organization = {{IEEE}}
} Per-clip and per-bitrate adaptation of the Lagrangian multiplier in video coding
Daniel J Ringis, Francois Pitie, Anil Kokaram
Applications of Digital Image Processing XLIV , vol. 11842 , pp. 118420o
@inproceedings{Ringis2021b,
  author       = {Ringis, Daniel J and Piti\'{e}, Fran\c{c}ois and Kokaram, Anil},
  title        = {Per-clip and per-bitrate adaptation of the {Lagrangian} multiplier in video coding},
  booktitle    = {Applications of Digital Image Processing XLIV},
  year         = {2021},
  volume       = {11842},
  pages        = {118420O},
  organization = {International Society for Optics and Photonics}
} Liaison and Pronunciation Learning in End-to-End Text-to-Speech in French
Jason Taylor, Sébastien Le Maguer, Korin Richmond
Speech Synthesis Workshop (SSW) , pp. 195--199
@inproceedings{Taylor2021,
  author    = {Jason Taylor and S\'{e}bastien {Le Maguer} and Korin Richmond},
  title     = {Liaison and Pronunciation Learning in End-to-End Text-to-Speech in French},
  booktitle = {Speech Synthesis Workshop (SSW)},
  year      = {2021},
  pages     = {195--199},
  doi       = {10.21437/ssw.2021-34},
  pdf       = {https://www.isca-speech.org/archive/pdfs/ssw_2021/taylor21_ssw.pdf}
} 2020
FlexEval, création de sites web légers pour des campagnes de tests perceptifs multimédias
Cédric Fayet, Alexis Blond, Grégoire Coulombel, Claude Simon, Damien Lolive et al.
Proceedings of JEP, TALN and RECITAL , pp. 22--25
@inproceedings{Fayet2020,
  author    = {C\'{e}dric Fayet and Alexis Blond and Gr\'{e}goire Coulombel and Claude Simon
               and Damien Lolive and Gw\'{e}nol\'{e} Lecorv\'{e} and Jonathan Chevelu
               and S\'{e}bastien {Le Maguer}},
  title     = {FlexEval, cr\'{e}ation de sites web l\'{e}gers pour des campagnes de tests perceptifs multim\'{e}dias},
  booktitle = {Proceedings of JEP, TALN and RECITAL},
  year      = {2020},
  pages     = {22--25},
  address   = {Nancy, France},
  url       = {https://hal.archives-ouvertes.fr/hal-02768500},
  pdf       = {https://hal.archives-ouvertes.fr/hal-02768500v4/document}
} A Bayesian View of Frame Interpolation and a Comparison with Existing Motion Picture Effects Tools
Anil Kokaram, Davinder Singh, Simon Robinson
2020 IEEE International Conference on Image Processing (ICIP) , pp. 553--557
@inproceedings{Kokaram2020,
  author    = {Kokaram, Anil and Singh, Davinder and Robinson, Simon},
  title     = {A Bayesian View of Frame Interpolation and a Comparison with Existing Motion Picture Effects Tools},
  booktitle = {2020 IEEE International Conference on Image Processing (ICIP)},
  year      = {2020},
  pages     = {553--557},
  doi       = {10.1109/icip40778.2020.9191152},
  keywords  = {Interpolation;Motion pictures;Optical imaging;Estimation;Image reconstruction;Bayes methods;Motion estimation;Motion interpolation;Frame interpolation;motion estimation}
} Can Auditory Nerve models tell us what's different about WaveNet vocoded speech?
Sébastien Le Maguer, Naomi Harte
Conference of the International Speech Communication Association (Interspeech)
@inproceedings{Maguer2020a,
  author    = {S\'{e}bastien {Le Maguer} and Naomi Harte},
  title     = {Can Auditory Nerve models tell us what's different about WaveNet vocoded speech?},
  booktitle = {Conference of the International Speech Communication Association (Interspeech)},
  year      = {2020},
  pdf       = {https://www.isca-speech.org/archive/Interspeech_2020/pdfs/2596.pdf}
} Investigation of Auditory Nerve Model Based Analysis for Vocoded Speech Synthesis
Sébastien Le Maguer, Naomi Harte
International Conference on Quality of Multimedia Experience (QoMEX) , pp. 1--6
@inproceedings{Maguer2020b,
  author    = {S\'{e}bastien {Le Maguer} and Naomi Harte},
  title     = {Investigation of Auditory Nerve Model Based Analysis for Vocoded Speech Synthesis},
  booktitle = {International Conference on Quality of Multimedia Experience (QoMEX)},
  year      = {2020},
  month     = {may},
  pages     = {1--6},
  publisher = {{IEEE}},
  doi       = {10.1109/QoMEX48832.2020.9123101},
  issn      = {2472-7814}
} Per-clip adaptive Lagrangian multiplier optimisation with low-resolution proxies
Daniel J Ringis, François Pitié, Anil Kokaram
Applications of Digital Image Processing XLIII , vol. 11510 , pp. 115100e
@inproceedings{Ringis2020a,
  author       = {Ringis, Daniel J and Piti\'{e}, Fran\c{c}ois and Kokaram, Anil},
  title        = {Per-clip adaptive {Lagrangian} multiplier optimisation with low-resolution proxies},
  booktitle    = {Applications of Digital Image Processing XLIII},
  year         = {2020},
  volume       = {11510},
  pages        = {115100E},
  organization = {International Society for Optics and Photonics}
} Per Clip Lagrangian Multiplier Optimisation for HEVC
Daniel J Ringis, François Pitié, Anil Kokaram
Electronic Imaging , vol. 2020 , no. 10 , pp. 136--1
@article{Ringis2020b,
  author    = {Ringis, Daniel J and Piti\'{e}, Fran\c{c}ois and Kokaram, Anil},
  title     = {Per Clip {Lagrangian} Multiplier Optimisation for {HEVC}},
  journal   = {Electronic Imaging},
  year      = {2020},
  volume    = {2020},
  number    = {10},
  pages     = {136-1},
  publisher = {Society for Imaging Science and Technology}
} Introducing Prosodic Speaker Identity for a Better Expressive Speech Synthesis Control
Aghilas Sini, Sébastien Le Maguer, Damien Lolive, Elisabeth Delais-Roussarie
Speech Prosody , pp. 935--939
@inproceedings{Sini2020,
  author    = {Aghilas Sini and S\'{e}bastien {Le Maguer} and Damien Lolive and Elisabeth Delais-Roussarie},
  title     = {Introducing Prosodic Speaker Identity for a Better Expressive Speech Synthesis Control},
  booktitle = {Speech Prosody},
  year      = {2020},
  pages     = {935--939},
  address   = {Tokyo (Japan)},
  doi       = {10.21437/SpeechProsody.2020-191},
  url       = {https://www.isca-speech.org/archive/SpeechProsody_2020/pdfs/75.pdf}
} Should robots have accents?
Ilaria Torre, Sébastien Le Maguer
International Conference on Robot & Human Interactive Communication (RO-MAN) , pp. 208--214
@inproceedings{Torre2020,
  author    = {Ilaria Torre and S\'{e}bastien {Le Maguer}},
  title     = {Should robots have accents?},
  booktitle = {International Conference on Robot \& Human Interactive Communication (RO-MAN)},
  year      = {2020},
  pages     = {208--214},
  doi       = {10.1109/ro-man47096.2020.9223599},
  pdf       = {http://kth.diva-portal.org/smash/get/diva2:1474825/FULLTEXT01.pdf}
} ASVspoof 2019: A large-scale public database of synthesized, converted and replayed speech
Xin Wang, Junichi Yamagishi, Massimiliano Todisco, Héctor Delgado, Andreas Nautsch et al.
Computer Speech and Language , vol. 64 , pp. 101114
@article{Wang2020,
  author    = {Xin Wang and Junichi Yamagishi and Massimiliano Todisco and H\'{e}ctor Delgado
               and Andreas Nautsch and Nicholas Evans and Md Sahidullah and Ville Vestman
               and Tomi Kinnunen and Kong Aik Lee and Lauri Juvela and Paavo Alku
               and Yu-Huai Peng and Hsin-Te Hwang and Yu Tsao and Hsin-Min Wang
               and S\'{e}bastien {Le Maguer} and Markus Becker and Fergus Henderson
               and Rob Clark and Yu Zhang and Quan Wang and Ye Jia and Kai Onuma
               and Koji Mushika and Takashi Kaneda and Yuan Jiang and Li-Juan Liu
               and Yi-Chiao Wu and Wen-Chin Huang and Tomoki Toda and Kou Tanaka
               and Hirokazu Kameoka and Ingmar Steiner and Driss Matrouf
               and Jean-Fran\c{c}ois Bonastre and Avashna Govender and Srikanth Ronanki
               and Jing-Xuan Zhang and Zhen-Hua Ling},
  title     = {{ASVspoof} 2019: A large-scale public database of synthesized, converted and replayed speech},
  journal   = {Computer Speech {\&} Language},
  year      = {2020},
  month     = {nov},
  volume    = {64},
  pages     = {101114},
  publisher = {Academic Press},
  doi       = {10.1016/j.csl.2020.101114},
  issn      = {0885-2308}
} 2019
A Low-Complexity Mosaicing Algorithm for Stock Assessment of Seabed-Burrowing Species
David Corrigan, Ken Sooknanan, Jennifer Doyle, Colm Lordan, Anil Kokaram
IEEE Journal of Oceanic Engineering , vol. 44 , no. 2 , pp. 386--400
@article{Corrigan2019,
  author    = {David Corrigan and Ken Sooknanan and Jennifer Doyle and Colm Lordan and Anil Kokaram},
  title     = {A Low-Complexity Mosaicing Algorithm for Stock Assessment of Seabed-Burrowing Species},
  journal   = {IEEE Journal of Oceanic Engineering},
  year      = {2019},
  month     = {apr},
  volume    = {44},
  number    = {2},
  pages     = {386--400},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  doi       = {10.1109/joe.2018.2808973},
  url       = {https://doi.org/10.1109/joe.2018.2808973}
} An Advert Creation System for Next-Gen Publicity
Atul Nautiyal, Killian McCabe, Murhaf Hossari, Soumyabrata Dev, Matthew Nicholson, Clare Conran et al.
Machine Learning and Knowledge Discovery in Databases , pp. 663--667
@incollection{Nautiyal2019,
  author        = {Atul Nautiyal and Killian McCabe and Murhaf Hossari and Soumyabrata Dev
                   and Matthew Nicholson and Clare Conran and Declan McKibben and Jian Tang
                   and Wei Xu and Fran\c{c}ois Piti\'{e}},
  title         = {An Advert Creation System for Next-Gen Publicity},
  booktitle     = {Machine Learning and Knowledge Discovery in Databases},
  year          = {2019},
  month         = {aug},
  pages         = {663--667},
  publisher     = {Springer International Publishing},
  doi           = {10.1007/978-3-030-10997-4_47},
  url           = {https://doi.org/10.1007/978-3-030-10997-4_47},
  urldate       = {2018-12-12},
  eprint        = {1808.00163},
  archiveprefix = {arXiv}
} Shot boundary detection based on orthogonal polynomial
Sadiq H. Abdulhussain, Abd Rahman Ramli, Basheera M. Mahmmod, M. Iqbal Saripan, Syed Abdul Rahman Al-Haddad et al.
Multimed Tools Appl , vol. 78 , no. 14 , pp. 20361--20382
@article{Abdulhussain2019,
  author    = {Sadiq H. Abdulhussain and Abd Rahman Ramli and Basheera M. Mahmmod
               and M. Iqbal Saripan and Syed Abdul Rahman Al-Haddad and Wissam A. Jassim},
  title     = {Shot boundary detection based on orthogonal polynomial},
  journal   = {Multimedia Tools and Applications},
  year      = {2019},
  month     = {feb},
  volume    = {78},
  number    = {14},
  pages     = {20361--20382},
  publisher = {Springer Science and Business Media {LLC}},
  doi       = {10.1007/s11042-019-7364-3},
  url       = {https://doi.org/10.1007/s11042-019-7364-3}
} Articulatory behaviour during disfluencies in stuttered speech
Ivana Didirková, Sébastien Le Maguer, Fabrice Hirsch, Dodji Gbedahou
Proceedings of the International Congress of Phonetic Science (ICPhS)
@inproceedings{Didirkov_a2019,
  author    = {Ivana Didirkov\'{a} and S\'{e}bastien {Le Maguer} and Fabrice Hirsch and Dodji Gbedahou},
  title     = {Articulatory behaviour during disfluencies in stuttered speech},
  booktitle = {Proceedings of the International Congress of Phonetic Science (ICPhS)},
  year      = {2019}
} Solar Flare Forecasting from Magnetic Feature Properties Generated by the Solar Monitor Active Region Tracker
Katarina Domijan, D. Shaun Bloomfield, François Pitié
Solar Physics , vol. 294 , no. 1
@article{Domijan2019,
  author    = {Katarina Domijan and D. Shaun Bloomfield and Fran\c{c}ois Piti\'{e}},
  title     = {Solar Flare Forecasting from Magnetic Feature Properties Generated by the Solar Monitor Active Region Tracker},
  journal   = {Solar Physics},
  year      = {2019},
  month     = {jan},
  volume    = {294},
  number    = {1},
  publisher = {Springer Science and Business Media {LLC}},
  doi       = {10.1007/s11207-018-1392-4},
  url       = {https://doi.org/10.1007/s11207-018-1392-4}
} NSQM: A non-intrusive assessment of speech quality using normalized energies of the neurogram
Wissam A. Jassim, Muhammad S. A. Zilany
Computer Speech & Language , vol. 58 , pp. 260--279
@article{Jassim2019,
  author    = {Wissam A. Jassim and Muhammad S. A. Zilany},
  title     = {{NSQM}: A non-intrusive assessment of speech quality using normalized energies of the neurogram},
  journal   = {Computer Speech {\&} Language},
  year      = {2019},
  month     = {nov},
  volume    = {58},
  pages     = {260--279},
  publisher = {Elsevier {BV}},
  doi       = {10.1016/j.csl.2019.04.005},
  url       = {https://doi.org/10.1016/j.csl.2019.04.005}
} Speech Enhancement Algorithm Based on Super-Gaussian Modeling and Orthogonal Polynomials
Basheera M. Mahmmod, Abd Rahman Ramli, Thar Baker, Feras Al-Obeidat, Sadiq H. Abdulhussain et al.
IEEE Access , vol. 7 , pp. 103485--103504
@article{Mahmmod2019,
  author    = {Basheera M. Mahmmod and Abd Rahman Ramli and Thar Baker and Feras Al-Obeidat
               and Sadiq H. Abdulhussain and Wissam A. Jassim},
  title     = {Speech Enhancement Algorithm Based on Super-Gaussian Modeling and Orthogonal Polynomials},
  journal   = {IEEE Access},
  year      = {2019},
  volume    = {7},
  pages     = {103485--103504},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  doi       = {10.1109/access.2019.2929864},
  url       = {https://doi.org/10.1109/access.2019.2929864}
} Speech Synthesis Evaluation - State-of-the-Art Assessment and Suggestion for a Novel Research Program
Petra Wagner, Jonas Beskow, Simon Betz, Jens Edlund, Joakim Gustafson et al.
10th ISCA Speech Synthesis Workshop
@inproceedings{Wagner2019,
  author    = {Petra Wagner and Jonas Beskow and Simon Betz and Jens Edlund and Joakim Gustafson
               and Gustav Eje Henter and S\'{e}bastien {Le Maguer} and Zofia Malisz
               and {\'{E}}va Sz\'{e}kely and Christina T{\aa}nnander and Jana Vo{\ss}e},
  title     = {Speech Synthesis Evaluation - State-of-the-Art Assessment and Suggestion for a Novel Research Program},
  booktitle = {10th {ISCA} Speech Synthesis Workshop},
  year      = {2019},
  month     = {sep},
  publisher = {{ISCA}},
  doi       = {10.21437/ssw.2019-19},
  url       = {https://doi.org/10.21437/ssw.2019-19}
} 2018
A New Hybrid form of Krawtchouk and Tchebichef Polynomials: Design and Application
Sadiq H. Abdulhussain, Abd Rahman Ramli, Basheera M. Mahmmod, M. Iqbal Saripan, Syed Abdul Rahman Al-Haddad et al.
J Math Imaging Vis , vol. 61 , no. 4 , pp. 555--570
@article{Abdulhussain2018a,
  author    = {Sadiq H. Abdulhussain and Abd Rahman Ramli and Basheera M. Mahmmod
               and M. Iqbal Saripan and Syed Abdul Rahman Al-Haddad and Wissam A. Jassim},
  title     = {A New Hybrid form of {Krawtchouk} and {Tchebichef} Polynomials: Design and Application},
  journal   = {Journal of Mathematical Imaging and Vision},
  year      = {2018},
  month     = {nov},
  volume    = {61},
  number    = {4},
  pages     = {555--570},
  publisher = {Springer Science and Business Media {LLC}},
  doi       = {10.1007/s10851-018-0863-4},
  url       = {https://doi.org/10.1007/s10851-018-0863-4}
} Methods and Challenges in Shot Boundary Detection: A Review
Sadiq H. Abdulhussain, Abd Ramli, M. Saripan, Basheera Mahmmod, Syed Abdul Rahman Al-Haddad, Wissam Jassim
Entropy , vol. 20 , no. 4 , pp. 214
@article{Abdulhussain2018b,
  author    = {Sadiq H. Abdulhussain and Abd Ramli and M. Saripan and Basheera Mahmmod
               and Syed Abdul Rahman Al-Haddad and Wissam Jassim},
  title     = {Methods and Challenges in Shot Boundary Detection: A Review},
  journal   = {Entropy},
  year      = {2018},
  month     = {mar},
  volume    = {20},
  number    = {4},
  pages     = {214},
  publisher = {{MDPI} {AG}},
  doi       = {10.3390/e20040214},
  url       = {https://doi.org/10.3390/e20040214}
} Radon transform of auditory neurograms: a robust feature set for phoneme classification
Md. Shariful Alam, Wissam A. Jassim, Muhammad S. A. Zilany
IET Signal Processing , vol. 12 , no. 3 , pp. 260--268
@article{Alam2018,
  author    = {Md. Shariful Alam and Wissam A. Jassim and Muhammad S. A. Zilany},
  title     = {Radon transform of auditory neurograms: a robust feature set for phoneme classification},
  journal   = {IET Signal Processing},
  year      = {2018},
  month     = {may},
  volume    = {12},
  number    = {3},
  pages     = {260--268},
  publisher = {Institution of Engineering and Technology ({IET})},
  doi       = {10.1049/iet-spr.2017.0170},
  url       = {https://doi.org/10.1049/iet-spr.2017.0170}
} Neural net architectures for image demosaicing
Rhys Buggy, Marco Forte, François Pitié
Applications of Digital Image Processing XLI
@inproceedings{Buggy2018,
  author    = {Rhys Buggy and Marco Forte and Fran\c{c}ois Piti\'{e}},
  title     = {Neural net architectures for image demosaicing},
  booktitle = {Applications of Digital Image Processing {XLI}},
  editor    = {Andrew G. Tescher},
  year      = {2018},
  month     = {sep},
  publisher = {{SPIE}},
  doi       = {10.1117/12.2322353},
  url       = {https://doi.org/10.1117/12.2322353}
} Estimation of the Asymmetry Parameter of the Glottal Flow Waveform Using the Electroglottographic Signal
João Cabral
Interspeech 2018
@inproceedings{Cabral2018,
  author    = {Jo\~{a}o Cabral},
  title     = {Estimation of the Asymmetry Parameter of the Glottal Flow Waveform Using the Electroglottographic Signal},
  booktitle = {Interspeech 2018},
  year      = {2018},
  month     = {sep},
  publisher = {{ISCA}},
  doi       = {10.21437/interspeech.2018-2371},
  url       = {https://doi.org/10.21437/interspeech.2018-2371}
} Perception and prediction of speaker appeal - A single speaker study
Ailbhe Cullen, Andrew Hines, Naomi Harte
Computer Speech & Language , vol. 52 , pp. 23--40
@article{Cullen2018,
  author    = {Ailbhe Cullen and Andrew Hines and Naomi Harte},
  title     = {Perception and prediction of speaker appeal - A single speaker study},
  journal   = {Computer Speech {\&} Language},
  year      = {2018},
  month     = {nov},
  volume    = {52},
  pages     = {23--40},
  publisher = {Elsevier {BV}},
  doi       = {10.1016/j.csl.2018.04.004},
  url       = {https://doi.org/10.1016/j.csl.2018.04.004}
} The Impact of Reduced Video Quality on Visual Speech Recognition
Laura Dungan, Ali Karaali, Naomi Harte
2018 25th IEEE International Conference on Image Processing (ICIP)
@inproceedings{Dungan2018,
  author    = {Laura Dungan and Ali Karaali and Naomi Harte},
  title     = {The Impact of Reduced Video Quality on Visual Speech Recognition},
  booktitle = {2018 25th {IEEE} International Conference on Image Processing ({ICIP})},
  year      = {2018},
  month     = {oct},
  publisher = {{IEEE}},
  doi       = {10.1109/icip.2018.8451754},
  url       = {https://doi.org/10.1109/icip.2018.8451754}
} ADNet: A Deep Network for Detecting Adverts
Murhaf Hossari, Soumyabrata Dev, Matthew Nicholson, Killian McCabe, Atul Nautiyal et al.
@misc{Hossari2018,
  author        = {Murhaf Hossari and Soumyabrata Dev and Matthew Nicholson and Killian McCabe
                   and Atul Nautiyal and Clare Conran and Jian Tang and Wei Xu
                   and Fran\c{c}ois Piti\'{e}},
  title         = {{ADNet}: A Deep Network for Detecting Adverts},
  year          = {2018},
  month         = {dec},
  publisher     = {arXiv},
  eprint        = {1811.04115},
  archiveprefix = {arXiv},
  url           = {http://arxiv.org/abs/1811.04115},
  urldate       = {2018-12-12},
  pdf           = {https://arxiv.org/pdf/1811.04115},
  copyright     = {All rights reserved},
  keywords      = {Computer Science - Machine Learning, Computer Science - Multimedia}
} Voice Activity Detection Using Neurograms
Wissam A. Jassim, Naomi Harte
2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)
@inproceedings{Jassim2018,
  author    = {Wissam A. Jassim and Naomi Harte},
  title     = {Voice Activity Detection Using Neurograms},
  booktitle = {2018 {IEEE} International Conference on Acoustics, Speech and Signal Processing ({ICASSP})},
  year      = {2018},
  month     = {apr},
  publisher = {{IEEE}},
  doi       = {10.1109/icassp.2018.8461952},
  url       = {https://doi.org/10.1109/icassp.2018.8461952}
} Edge-Based Defocus Blur Estimation With Adaptive Scale Selection
Ali Karaali, Claudio Rosito Jung
IEEE Transactions on Image Processing , vol. 27 , no. 3 , pp. 1126--1137
@article{Karaali2018a,
  author    = {Ali Karaali and Claudio Rosito Jung},
  title     = {Edge-Based Defocus Blur Estimation With Adaptive Scale Selection},
  journal   = {IEEE Transactions on Image Processing},
  year      = {2018},
  month     = {mar},
  volume    = {27},
  number    = {3},
  pages     = {1126--1137},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  doi       = {10.1109/tip.2017.2771563},
  url       = {https://doi.org/10.1109/tip.2017.2771563}
} Temporal Consistency for Still Image Based Defocus Blur Estimation Methods
Ali Karaali, Claudio Rosito Jung, François Pitié
2018 25th IEEE International Conference on Image Processing (ICIP)
@inproceedings{Karaali2018b,
  author    = {Ali Karaali and Claudio Rosito Jung and Fran\c{c}ois Piti\'{e}},
  title     = {Temporal Consistency for Still Image Based Defocus Blur Estimation Methods},
  booktitle = {2018 25th {IEEE} International Conference on Image Processing ({ICIP})},
  year      = {2018},
  month     = {oct},
  publisher = {{IEEE}},
  doi       = {10.1109/icip.2018.8451778},
  url       = {https://doi.org/10.1109/icip.2018.8451778}
} Using video quality metrics for something other than compression
Anil Kokaram, Chao Chen, Yilin Wang, Jessie Lin, Balu Adsumilli et al.
Applications of Digital Image Processing XLI
@inproceedings{Kokaram2018,
  author    = {Anil Kokaram and Chao Chen and Yilin Wang and Jessie Lin and Balu Adsumilli
               and Steve Benting and Neil Birkbeck and Damien Kelly and Michele Covell
               and Sasi Inguva},
  title     = {Using video quality metrics for something other than compression},
  booktitle = {Applications of Digital Image Processing {XLI}},
  editor    = {Andrew G. Tescher},
  year      = {2018},
  month     = {sep},
  publisher = {{SPIE}},
  doi       = {10.1117/12.2322506},
  url       = {https://doi.org/10.1117/12.2322506}
} Signal compression and enhancement using a new orthogonal-polynomial-based discrete transform
Basheera M. Mahmmod, Abd Rahman bin Ramli, Sadiq H. Abdulhussain, Syed Abdul Rahman Al-Haddad, Wissam A. Jassim
IET Signal Processing , vol. 12 , no. 1 , pp. 129--142
@article{Mahmmod2018,
  author    = {Basheera M. Mahmmod and Abd Rahman bin Ramli and Sadiq H. Abdulhussain
               and Syed Abdul Rahman Al-Haddad and Wissam A. Jassim},
  title     = {Signal compression and enhancement using a new orthogonal-polynomial-based discrete transform},
  journal   = {IET Signal Processing},
  year      = {2018},
  month     = {feb},
  volume    = {12},
  number    = {1},
  pages     = {129--142},
  publisher = {Institution of Engineering and Technology ({IET})},
  doi       = {10.1049/iet-spr.2016.0449},
  url       = {https://doi.org/10.1049/iet-spr.2016.0449}
} Acoustic distinctions between speech and singing: Is singing acoustically more stable than speech?
Beatriz Medeiros, João Cabral
9th International Conference on Speech Prosody 2018
@inproceedings{Medeiros2018,
  author = {Beatriz Medeiros and Jo\~{a}o Cabral},
  title = {Acoustic distinctions between speech and singing: Is singing acoustically more stable than speech?},
  booktitle = {9th International Conference on Speech Prosody 2018},
  year = {2018},
  month = {jun},
  publisher = {{ISCA}},
  doi = {10.21437/speechprosody.2018-110},
  url = {https://doi.org/10.21437/speechprosody.2018-110}
} Measuring vocal difference in bird population pairs
Colm O'Reilly, Kangkuso Analuddin, David J. Kelly, Naomi Harte
The Journal of the Acoustical Society of America , vol. 143 , no. 3 , pp. 1658--1671
@article{O_Reilly2018,
  author = {Colm O'Reilly and Kangkuso Analuddin and David J. Kelly and Naomi Harte},
  title = {Measuring vocal difference in bird population pairs},
  journal = {The Journal of the Acoustical Society of America},
  year = {2018},
  month = {mar},
  volume = {143},
  number = {3},
  pages = {1658--1671},
  publisher = {Acoustical Society of America ({ASA})},
  doi = {10.1121/1.5027244},
  url = {https://doi.org/10.1121/1.5027244}
} Using modern motion estimation algorithms in existing video codecs
Daniel Joseph Ringis, Davinder Singh, François Pitié, Anil Kokaram
Applications of Digital Image Processing XLI
@inproceedings{Ringis2018,
  author = {Daniel Joseph Ringis and Davinder Singh and Fran\c{c}ois Piti\'{e} and Anil Kokaram},
  title = {Using modern motion estimation algorithms in existing video codecs},
  booktitle = {Applications of Digital Image Processing {XLI}},
  editor = {Andrew G. Tescher},
  year = {2018},
  month = {sep},
  publisher = {{SPIE}},
  doi = {10.1117/12.2322411},
  url = {https://doi.org/10.1117/12.2322411}
} Investigating Speech Features for Continuous Turn-Taking Prediction Using LSTMs
Matthew Roddy, Gabriel Skantze, Naomi Harte
Interspeech 2018
@inproceedings{Roddy2018,
  author = {Matthew Roddy and Gabriel Skantze and Naomi Harte},
  title = {Investigating Speech Features for Continuous Turn-Taking Prediction Using {LSTMs}},
  booktitle = {Interspeech 2018},
  year = {2018},
  month = {sep},
  publisher = {{ISCA}},
  doi = {10.21437/interspeech.2018-2124},
  url = {https://doi.org/10.21437/interspeech.2018-2124}
} Attention-based Audio-Visual Fusion for Robust Automatic Speech Recognition
George Sterpu, Christian Saam, Naomi Harte
Proceedings of the 20th ACM International Conference on Multimodal Interaction
@inproceedings{Sterpu2018a,
  author = {George Sterpu and Christian Saam and Naomi Harte},
  title = {Attention-based Audio-Visual Fusion for Robust Automatic Speech Recognition},
  booktitle = {Proceedings of the 20th {ACM} International Conference on Multimodal Interaction},
  year = {2018},
  month = {oct},
  publisher = {{ACM}},
  doi = {10.1145/3242969.3243014},
  url = {https://doi.org/10.1145/3242969.3243014}
} Can DNNs Learn to Lipread Full Sentences?
George Sterpu, Christian Saam, Naomi Harte
2018 25th IEEE International Conference on Image Processing (ICIP)
@inproceedings{Sterpu2018b,
  author = {George Sterpu and Christian Saam and Naomi Harte},
  title = {Can {DNNs} Learn to Lipread Full Sentences?},
  booktitle = {2018 25th {IEEE} International Conference on Image Processing ({ICIP})},
  year = {2018},
  month = {oct},
  publisher = {{IEEE}},
  doi = {10.1109/icip.2018.8451388},
  url = {https://doi.org/10.1109/icip.2018.8451388}
} Trust in artificial voices: A "congruency effect" of first impressions and behavioural experience
Ilaria Torre, Jeremy Goslin, Laurence White, Debora Zanatto
Proceedings of the Technology, Mind, and Society
@inproceedings{Torre2018,
  author = {Ilaria Torre and Jeremy Goslin and Laurence White and Debora Zanatto},
  title = {Trust in artificial voices: {A} "congruency effect" of first impressions and behavioural experience},
  booktitle = {Proceedings of the Technology, Mind, and Society},
  year = {2018},
  month = {apr},
  publisher = {{ACM}},
  doi = {10.1145/3183654.3183691},
  url = {https://doi.org/10.1145/3183654.3183691}
} 2017
Image edge detection operators based on orthogonal polynomials
Sadiq H. Abdulhussain, Abd. Rahman Ramli, Basheera M. Mahmmod, Syed Abdul Rahman Al-Haddad, Wissam A. Jassim
International Journal of Image and Data Fusion , pp. 1--16
@article{Abdulhussain2017a,
  author = {Sadiq H. Abdulhussain and Abd. Rahman Ramli and Basheera M. Mahmmod and Syed Abdul Rahman Al-Haddad and Wissam A. Jassim},
  title = {Image edge detection operators based on orthogonal polynomials},
  journal = {International Journal of Image and Data Fusion},
  year = {2017},
  month = {may},
  pages = {1--16},
  publisher = {Informa {UK} Limited},
  doi = {10.1080/19479832.2017.1326405},
  url = {https://doi.org/10.1080/19479832.2017.1326405}
} On Computational Aspects of Tchebichef Polynomials for Higher Polynomial Order
Sadiq H. Abdulhussain, Abd Rahman Ramli, Syed Abdul Rahman Al-Haddad, Basheera M. Mahmmod, Wissam A. Jassim
IEEE Access , vol. 5 , pp. 2470--2478
@article{Abdulhussain2017b,
  author = {Sadiq H. Abdulhussain and Abd Rahman Ramli and Syed Abdul Rahman Al-Haddad and Basheera M. Mahmmod and Wissam A. Jassim},
  title = {On Computational Aspects of Tchebichef Polynomials for Higher Polynomial Order},
  journal = {IEEE Access},
  year = {2017},
  volume = {5},
  pages = {2470--2478},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  doi = {10.1109/access.2017.2669218},
  url = {https://doi.org/10.1109/access.2017.2669218}
} Phoneme Classification Using the Auditory Neurogram
Md. Shariful Alam, Muhammad S. A. Zilany, Wissam A. Jassim, Mohd Yazed Ahmad
IEEE Access , vol. 5 , pp. 633--642
@article{Alam2017,
  author = {Md. Shariful Alam and Muhammad S. A. Zilany and Wissam A. Jassim and Mohd Yazed Ahmad},
  title = {Phoneme Classification Using the Auditory Neurogram},
  journal = {IEEE Access},
  year = {2017},
  volume = {5},
  pages = {633--642},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  doi = {10.1109/access.2016.2647229},
  url = {https://doi.org/10.1109/access.2016.2647229}
} The Influence of Synthetic Voice on the Evaluation of a Virtual Character
João Cabral, Benjamin R. Cowan, Katja Zibrek, Rachel McDonnell
Interspeech 2017
@inproceedings{Cabral2017,
  author = {Jo\~{a}o Cabral and Benjamin R. Cowan and Katja Zibrek and Rachel McDonnell},
  title = {The Influence of Synthetic Voice on the Evaluation of a Virtual Character},
  booktitle = {Interspeech 2017},
  year = {2017},
  month = {aug},
  publisher = {{ISCA}},
  doi = {10.21437/interspeech.2017-325},
  url = {https://doi.org/10.21437/interspeech.2017-325}
} Thin slicing to predict viewer impressions of TED Talks
Ailbhe Cullen, Naomi Harte
The 14th International Conference on Auditory-Visual Speech Processing
@inproceedings{Cullen2017,
  author = {Ailbhe Cullen and Naomi Harte},
  title = {Thin slicing to predict viewer impressions of {TED} Talks},
  booktitle = {The 14th International Conference on Auditory-Visual Speech Processing},
  year = {2017},
  month = {aug},
  publisher = {{ISCA}},
  doi = {10.21437/avsp.2017-12},
  url = {https://doi.org/10.21437/avsp.2017-12}
} A no-reference video quality predictor for compression and scaling artifacts
Deepti Ghadiyaram, Chao Chen, Sasi Inguva, Anil Kokaram
2017 IEEE International Conference on Image Processing (ICIP)
@inproceedings{Ghadiyaram2017,
  author = {Deepti Ghadiyaram and Chao Chen and Sasi Inguva and Anil Kokaram},
  title = {A no-reference video quality predictor for compression and scaling artifacts},
  booktitle = {2017 {IEEE} International Conference on Image Processing ({ICIP})},
  year = {2017},
  month = {sep},
  publisher = {{IEEE}},
  doi = {10.1109/icip.2017.8296922},
  url = {https://doi.org/10.1109/icip.2017.8296922}
} A software radio LTE network testbed for video quality of experience experimentation
Ismael Gomez, Paul Sutton, Avishek Nag, Ahmed Selim, Linda Doyle et al.
2017 Ninth International Conference on Quality of Multimedia Experience (QoMEX)
@inproceedings{Gomez2017,
  author = {Ismael Gomez and Paul Sutton and Avishek Nag and Ahmed Selim and Linda Doyle and Vivek Ramachandran and Anil Kokaram},
  title = {A software radio {LTE} network testbed for video quality of experience experimentation},
  booktitle = {2017 Ninth International Conference on Quality of Multimedia Experience ({QoMEX})},
  year = {2017},
  month = {may},
  publisher = {{IEEE}},
  doi = {10.1109/qomex.2017.7965667},
  url = {https://doi.org/10.1109/qomex.2017.7965667}
} A No-Reference Video Quality Predictor For Compressed Videos
Sasi Inguva, Chao Chen, Anil Kokaram
@misc{Inguva2017,
  author = {Sasi Inguva and Chao Chen and Anil Kokaram},
  title = {A No-Reference Video Quality Predictor For Compressed Videos},
  year = {2017}
} Speech emotion classification using combined neurogram and INTERSPEECH 2010 paralinguistic challenge features
Wissam A. Jassim, Raveendran Paramesran, Naomi Harte
IET Signal Processing , vol. 11 , no. 5 , pp. 587--595
@article{Jassim2017,
  author = {Wissam A. Jassim and Raveendran Paramesran and Naomi Harte},
  title = {Speech emotion classification using combined neurogram and {INTERSPEECH} 2010 paralinguistic challenge features},
  journal = {IET Signal Processing},
  year = {2017},
  month = {jul},
  volume = {11},
  number = {5},
  pages = {587--595},
  publisher = {Institution of Engineering and Technology ({IET})},
  doi = {10.1049/iet-spr.2016.0336},
  url = {https://doi.org/10.1049/iet-spr.2016.0336}
} Low-Distortion MMSE Speech Enhancement Estimator Based on Laplacian Prior
Basheera M. Mahmmod, Abd Rahman Ramli, Sadiq H. Abdulhussain, Syed Abdul Rahman Al-Haddad, Wissam A. Jassim
IEEE Access , vol. 5 , pp. 9866--9881
@article{Mahmmod2017,
  author = {Basheera M. Mahmmod and Abd Rahman Ramli and Sadiq H. Abdulhussain and Syed Abdul Rahman Al-Haddad and Wissam A. Jassim},
  title = {Low-Distortion {MMSE} Speech Enhancement Estimator Based on Laplacian Prior},
  journal = {IEEE Access},
  year = {2017},
  volume = {5},
  pages = {9866--9881},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  doi = {10.1109/access.2017.2699782},
  url = {https://doi.org/10.1109/access.2017.2699782}
} Automatic frequency feature extraction for bird species delimitation
Colm O'Reilly, Münevver Köküer, Peter Jancovic, Regan Drennan, Naomi Harte
2017 25th European Signal Processing Conference (EUSIPCO)
@inproceedings{O_Reilly2017a,
  author = {Colm O'Reilly and M\"{u}nevver K\"{o}k\"{u}er and Peter Jancovic and Regan Drennan and Naomi Harte},
  title = {Automatic frequency feature extraction for bird species delimitation},
  booktitle = {2017 25th European Signal Processing Conference ({EUSIPCO})},
  year = {2017},
  month = {aug},
  publisher = {{IEEE}},
  doi = {10.23919/eusipco.2017.8081511},
  url = {https://doi.org/10.23919/eusipco.2017.8081511}
} Pitch tracking of bird vocalizations and an automated process using YIN-bird
Colm O'Reilly, Naomi Harte
Cogent Biology , vol. 3 , no. 1 , pp. 1322025
@article{O_Reilly2017b,
  author = {Colm O'Reilly and Naomi Harte},
  title = {Pitch tracking of bird vocalizations and an automated process using {YIN}-bird},
  journal = {Cogent Biology},
  editor = {Hynek Burda},
  year = {2017},
  month = {jan},
  volume = {3},
  number = {1},
  pages = {1322025},
  publisher = {Informa {UK} Limited},
  doi = {10.1080/23312025.2017.1322025},
  url = {https://doi.org/10.1080/23312025.2017.1322025}
} Detecting conversational gaze aversion using unsupervised learning
Matthew Roddy, Naomi Harte
2017 25th European Signal Processing Conference (EUSIPCO)
@inproceedings{Roddy2017a,
  author = {Matthew Roddy and Naomi Harte},
  title = {Detecting conversational gaze aversion using unsupervised learning},
  booktitle = {2017 25th European Signal Processing Conference ({EUSIPCO})},
  year = {2017},
  month = {aug},
  publisher = {{IEEE}},
  doi = {10.23919/eusipco.2017.8081172},
  url = {https://doi.org/10.23919/eusipco.2017.8081172}
} Towards predicting dialog acts from previous speakers non-verbal cues
Matthew Roddy, Naomi Harte
MMSYM
@inproceedings{Roddy2017b,
  author = {Matthew Roddy and Naomi Harte},
  title = {Towards predicting dialog acts from previous speakers non-verbal cues},
  booktitle = {{MMSYM}},
  year = {2017},
  pdf = {http://mmsym.org/wp-content/uploads/2017/10/MMSYM2017\_paper5\_RoddyHarte.pdf}
} Objective Assessment of Perceptual Audio Quality Using ViSQOLAudio
Colm Sloan, Naomi Harte, Damien Kelly, Anil Kokaram, Andrew Hines
IEEE Transactions on Broadcasting , vol. 63 , no. 4 , pp. 693--705
@article{Sloan2017,
  author = {Colm Sloan and Naomi Harte and Damien Kelly and Anil Kokaram and Andrew Hines},
  title = {Objective Assessment of Perceptual Audio Quality Using {ViSQOLAudio}},
  journal = {IEEE Transactions on Broadcasting},
  year = {2017},
  month = {dec},
  volume = {63},
  number = {4},
  pages = {693--705},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  doi = {10.1109/tbc.2017.2704421},
  url = {https://doi.org/10.1109/tbc.2017.2704421}
} Towards Lipreading Sentences with Active Appearance Models
George Sterpu, Naomi Harte
The 14th International Conference on Auditory-Visual Speech Processing
@inproceedings{Sterpu2017,
  author = {George Sterpu and Naomi Harte},
  title = {Towards Lipreading Sentences with Active Appearance Models},
  booktitle = {The 14th International Conference on Auditory-Visual Speech Processing},
  year = {2017},
  month = {aug},
  publisher = {{ISCA}},
  doi = {10.21437/avsp.2017-14},
  url = {https://doi.org/10.21437/avsp.2017-14}
} A longitudinal database of Irish political speech with annotations of speaker ability
Ailbhe Cullen, Naomi Harte
Language Resources and Evaluation , vol. 52 , no. 2 , pp. 401--432
@article{Cullen2017b,
  author = {Ailbhe Cullen and Naomi Harte},
  title = {A longitudinal database of Irish political speech with annotations of speaker ability},
  journal = {Language Resources and Evaluation},
  year = {2017},
  month = {sep},
  volume = {52},
  number = {2},
  pages = {401--432},
  publisher = {Springer Science and Business Media {LLC}},
  doi = {10.1007/s10579-017-9401-z},
  url = {https://doi.org/10.1007/s10579-017-9401-z}
} 2016
Anatomy from the outside in: a new on-line surface anatomy guide
V. B. Morris, David Corrigan, U. Sealy, Anil Kokaram, M. O'Dea et al.
Journal of Anatomy , vol. 228 , no. 1 , pp. 24--25
@article{2016,
  author = {V. B. Morris and David Corrigan and U. Sealy and Anil Kokaram and M. O'Dea and T. C. Lee},
  title = {Anatomy from the outside in: a new on-line surface anatomy guide},
  journal = {Journal of Anatomy},
  year = {2016},
  month = {jan},
  volume = {228},
  number = {1},
  pages = {24--25}
} The ADAPT entry to the Blizzard Challenge 2016
João Cabral, Christian Saam, Eva Vanmassenhove, S. Bradley, Fasih Haider
Proceedings of the Blizzard Challenge 2016 Workshop
@inproceedings{Cabral2016,
  author = {Jo\~{a}o Cabral and Christian Saam and Eva Vanmassenhove and S. Bradley and Fasih Haider},
  title = {The {ADAPT} entry to the Blizzard Challenge 2016},
  booktitle = {Proceedings of the Blizzard Challenge 2016 Workshop},
  year = {2016},
  address = {Cupertino, CA, USA}
} A Perceptual Quality Metric for Videos Distorted by Spatially Correlated Noise
Chao Chen, Mohammad Izadi, Anil Kokaram
Proceedings of the 24th ACM international conference on Multimedia
@inproceedings{Chen2016a,
  author = {Chao Chen and Mohammad Izadi and Anil Kokaram},
  title = {A Perceptual Quality Metric for Videos Distorted by Spatially Correlated Noise},
  booktitle = {Proceedings of the 24th {ACM} international conference on Multimedia},
  year = {2016},
  month = {oct},
  publisher = {{ACM}},
  doi = {10.1145/2964284.2964302},
  url = {https://doi.org/10.1145/2964284.2964302}
} A Subjective Study for the Design of Multi-resolution ABR Video Streams with the VP9 Codec
Chao Chen, Sasi Inguva, Andrew Rankin, Anil Kokaram
Electronic Imaging , vol. 2016 , no. 2 , pp. 1--5
@article{Chen2016b,
  author = {Chao Chen and Sasi Inguva and Andrew Rankin and Anil Kokaram},
  title = {A Subjective Study for the Design of Multi-resolution {ABR} Video Streams with the {VP9} Codec},
  journal = {Electronic Imaging},
  year = {2016},
  month = {feb},
  volume = {2016},
  number = {2},
  pages = {1--5},
  publisher = {Society for Imaging Science {\&} Technology},
  doi = {10.2352/issn.2470-1173.2016.2.vipc-235},
  url = {https://doi.org/10.2352/issn.2470-1173.2016.2.vipc-235}
} Optimizing Transcoder Quality Targets Using a Neural Network with an Embedded Bitrate Model
Michele Covell, Martín Arjovsky, Yao-Chung Lin, Anil Kokaram
Electronic Imaging , vol. 2016 , no. 2 , pp. 1--7
@article{Covell2016,
  author = {Michele Covell and Mart{\'{\i}}n Arjovsky and Yao-Chung Lin and Anil Kokaram},
  title = {Optimizing Transcoder Quality Targets Using a Neural Network with an Embedded Bitrate Model},
  journal = {Electronic Imaging},
  year = {2016},
  month = {feb},
  volume = {2016},
  number = {2},
  pages = {1--7},
  publisher = {Society for Imaging Science {\&} Technology},
  doi = {10.2352/issn.2470-1173.2016.2.vipc-237},
  url = {https://doi.org/10.2352/issn.2470-1173.2016.2.vipc-237}
} A robust automatic birdsong phrase classification: A template-based approach
Kantapon Kaewtip, Abeer Alwan, Colm O'Reilly, Charles E. Taylor
The Journal of the Acoustical Society of America , vol. 140 , no. 5 , pp. 3691--3701
@article{Kaewtip2016,
  author = {Kantapon Kaewtip and Abeer Alwan and Colm O'Reilly and Charles E. Taylor},
  title = {A robust automatic birdsong phrase classification: {A} template-based approach},
  journal = {The Journal of the Acoustical Society of America},
  year = {2016},
  month = {nov},
  volume = {140},
  number = {5},
  pages = {3691--3701},
  publisher = {Acoustical Society of America ({ASA})},
  doi = {10.1121/1.4966592},
  url = {https://doi.org/10.1121/1.4966592}
} YIN-Bird: Improved Pitch Tracking for Bird Vocalisations
Colm O'Reilly, Nicola M. Marples, David J. Kelly, Naomi Harte
Interspeech 2016
@inproceedings{O_Reilly2016,
  author = {Colm O'Reilly and Nicola M. Marples and David J. Kelly and Naomi Harte},
  title = {{YIN}-Bird: Improved Pitch Tracking for Bird Vocalisations},
  booktitle = {Interspeech 2016},
  year = {2016},
  month = {sep},
  publisher = {{ISCA}},
  doi = {10.21437/interspeech.2016-90},
  url = {https://doi.org/10.21437/interspeech.2016-90}
} An alternative matting Laplacian
François Pitié
2016 IEEE International Conference on Image Processing (ICIP)
@inproceedings{Piti_e2016a,
  author = {Fran\c{c}ois Piti\'{e}},
  title = {An alternative matting {Laplacian}},
  booktitle = {2016 {IEEE} International Conference on Image Processing ({ICIP})},
  year = {2016},
  month = {sep},
  publisher = {{IEEE}},
  doi = {10.1109/icip.2016.7533035},
  url = {https://doi.org/10.1109/icip.2016.7533035}
} Rank Reduced Alternative Matting Laplacian
François Pitié
Proceedings of the 13th European Conference on Visual Media Production (CVMP 2016)
@inproceedings{Piti_e2016b,
  author = {Fran\c{c}ois Piti\'{e}},
  title = {Rank Reduced Alternative Matting Laplacian},
  booktitle = {Proceedings of the 13th European Conference on Visual Media Production ({CVMP} 2016)},
  year = {2016},
  publisher = {{ACM} Press},
  doi = {10.1145/2998559.2998566},
  url = {https://doi.org/10.1145/2998559.2998566}
} Geometry-driven quantization for omnidirectional image coding
Francesca De Simone, Pascal Frossard, Paul Wilkins, Neil Birkbeck, Anil Kokaram
2016 Picture Coding Symposium (PCS)
@inproceedings{Simone2016,
  author = {De Simone, Francesca and Pascal Frossard and Paul Wilkins and Neil Birkbeck and Anil Kokaram},
  title = {Geometry-driven quantization for omnidirectional image coding},
  booktitle = {2016 Picture Coding Symposium ({PCS})},
  year = {2016},
  publisher = {{IEEE}},
  doi = {10.1109/pcs.2016.7906402},
  url = {https://doi.org/10.1109/pcs.2016.7906402}
} Bitrate classification of twice-encoded audio using objective quality features
Colm Sloan, Naomi Harte, Damien Kelly, Anil Kokaram, Andrew Hines
2016 Eighth International Conference on Quality of Multimedia Experience (QoMEX)
@inproceedings{Sloan2016,
  author = {Colm Sloan and Naomi Harte and Damien Kelly and Anil Kokaram and Andrew Hines},
  title = {Bitrate classification of twice-encoded audio using objective quality features},
  booktitle = {2016 Eighth International Conference on Quality of Multimedia Experience ({QoMEX})},
  year = {2016},
  month = {jun},
  publisher = {{IEEE}},
  doi = {10.1109/qomex.2016.7498956},
  url = {https://doi.org/10.1109/qomex.2016.7498956}
} Prediction of Emotions from Text using Sentiment Analysis for Expressive Speech Synthesis
Eva Vanmassenhove, João Cabral, Fasih Haider
9th ISCA Speech Synthesis Workshop
@inproceedings{Vanmassenhove2016,
  author = {Eva Vanmassenhove and Jo\~{a}o Cabral and Fasih Haider},
  title = {Prediction of Emotions from Text using Sentiment Analysis for Expressive Speech Synthesis},
  booktitle = {9th {ISCA} Speech Synthesis Workshop},
  year = {2016},
  month = {sep},
  publisher = {{ISCA}},
  doi = {10.21437/ssw.2016-4},
  url = {https://doi.org/10.21437/ssw.2016-4}
} A cloud-based large-scale distributed video analysis system
Yongzhe Wang, Wei-Ta Chen, Huahui Wu, Anil Kokaram, Jaron Schaeffer
2016 IEEE International Conference on Image Processing (ICIP)
@inproceedings{Wang2016a,
  author = {Yongzhe Wang and Wei-Ta Chen and Huahui Wu and Anil Kokaram and Jaron Schaeffer},
  title = {A cloud-based large-scale distributed video analysis system},
  booktitle = {2016 {IEEE} International Conference on Image Processing ({ICIP})},
  year = {2016},
  month = {sep},
  publisher = {{IEEE}},
  doi = {10.1109/icip.2016.7532608},
  url = {https://doi.org/10.1109/icip.2016.7532608}
} A perceptual visibility metric for banding artifacts
Yilin Wang, Sang-Uok Kum, Chao Chen, Anil Kokaram
2016 IEEE International Conference on Image Processing (ICIP)
@inproceedings{Wang2016b,
  author = {Yilin Wang and Sang-Uok Kum and Chao Chen and Anil Kokaram},
  title = {A perceptual visibility metric for banding artifacts},
  booktitle = {2016 {IEEE} International Conference on Image Processing ({ICIP})},
  year = {2016},
  month = {sep},
  publisher = {{IEEE}},
  doi = {10.1109/icip.2016.7532722},
  url = {https://doi.org/10.1109/icip.2016.7532722}
} Double-Tip Artifact Removal From Atomic Force Microscopy Images
Yun-Feng Wang, Jason I. Kilpatrick, Suzanne Jarvis, Frank Boland, Anil Kokaram et al.
IEEE Transactions on Image Processing , vol. 25 , no. 6 , pp. 2774--2788
@article{Wang2016c,
  author = {Yun-Feng Wang and Jason I. Kilpatrick and Suzanne Jarvis and Frank Boland and Anil Kokaram and David Corrigan},
  title = {Double-Tip Artifact Removal From Atomic Force Microscopy Images},
  journal = {IEEE Transactions on Image Processing},
  year = {2016},
  month = {jun},
  volume = {25},
  number = {6},
  pages = {2774--2788},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  doi = {10.1109/tip.2016.2532239},
  url = {https://doi.org/10.1109/tip.2016.2532239}
} 2015
TCD-TIMIT: An Audio-Visual Corpus of Continuous Speech
Naomi Harte, Eoin Gillen
IEEE Transactions on Multimedia , vol. 17 , no. 5 , pp. 603--615
@article{Harte2015a,
  author = {Naomi Harte and Eoin Gillen},
  title = {{TCD}-{TIMIT}: An Audio-Visual Corpus of Continuous Speech},
  journal = {IEEE Transactions on Multimedia},
  year = {2015},
  month = {may},
  volume = {17},
  number = {5},
  pages = {603--615},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  doi = {10.1109/tmm.2015.2407694},
  url = {https://doi.org/10.1109/tmm.2015.2407694}
} TCD-VoIP, a research database of degraded speech for assessing quality in VoIP applications
Naomi Harte, Eoin Gillen, Andrew Hines
2015 Seventh International Workshop on Quality of Multimedia Experience (QoMEX)
@inproceedings{Harte2015b,
  author = {Naomi Harte and Eoin Gillen and Andrew Hines},
  title = {{TCD}-{VoIP}, a research database of degraded speech for assessing quality in {VoIP} applications},
  booktitle = {2015 Seventh International Workshop on Quality of Multimedia Experience ({QoMEX})},
  year = {2015},
  month = {may},
  publisher = {{IEEE}},
  doi = {10.1109/qomex.2015.7148100},
  url = {https://doi.org/10.1109/qomex.2015.7148100}
} ViSQOL: an objective speech quality model
Andrew Hines, Jan Skoglund, Anil Kokaram, Naomi Harte
EURASIP Journal on Audio, Speech, and Music Processing , vol. 2015 , no. 1
@article{Hines2015a,
  author = {Andrew Hines and Jan Skoglund and Anil Kokaram and Naomi Harte},
  title = {{ViSQOL}: an objective speech quality model},
  journal = {{EURASIP} Journal on Audio, Speech, and Music Processing},
  year = {2015},
  month = {may},
  volume = {2015},
  number = {1},
  publisher = {Springer Science and Business Media {LLC}},
  doi = {10.1186/s13636-015-0054-9},
  url = {https://doi.org/10.1186/s13636-015-0054-9}
} ViSQOLAudio: An objective audio quality metric for low bitrate codecs
Andrew Hines, Eoin Gillen, Damien Kelly, Jan Skoglund, Anil Kokaram et al.
The Journal of the Acoustical Society of America , vol. 137 , no. 6 , pp. EL449--EL455
@article{Hines2015b,
  author = {Andrew Hines and Eoin Gillen and Damien Kelly and Jan Skoglund and Anil Kokaram and Naomi Harte},
  title = {{ViSQOLAudio}: An objective audio quality metric for low bitrate codecs},
  journal = {The Journal of the Acoustical Society of America},
  year = {2015},
  month = {jun},
  volume = {137},
  number = {6},
  pages = {EL449--EL455},
  publisher = {Acoustical Society of America ({ASA})},
  doi = {10.1121/1.4921674},
  url = {https://doi.org/10.1121/1.4921674}
} Forensic comparison of ageing voices from automatic and auditory perspectives
Finnian Kelly, Naomi Harte
International Journal of Speech, Language and the Law , vol. 22 , no. 2 , pp. 167--202
@article{Kelly2015,
  author = {Finnian Kelly and Naomi Harte},
  title = {Forensic comparison of ageing voices from automatic and auditory perspectives},
  journal = {International Journal of Speech, Language and the Law},
  year = {2015},
  month = {oct},
  volume = {22},
  number = {2},
  pages = {167--202},
  publisher = {Equinox Publishing},
  doi = {10.1558/ijsll.v22i2.21760},
  url = {https://doi.org/10.1558/ijsll.v22i2.21760}
} Special Issue in Honour of William J. (Bill) Fitzgerald
Ercan E. Kuruoglu, Joan Lasenby, A. Taylan Cemgil, Anil Kokaram, Robin D. Morris
Digital Signal Processing , vol. 47 , pp. 1--2
@article{Kuruoglu2015,
  author = {Ercan E. Kuruoglu and Joan Lasenby and A. Taylan Cemgil and Anil Kokaram and Robin D. Morris},
  title = {Special Issue in Honour of William J. (Bill) Fitzgerald},
  journal = {Digital Signal Processing},
  year = {2015},
  month = {dec},
  volume = {47},
  pages = {1--2},
  publisher = {Elsevier {BV}},
  doi = {10.1016/j.dsp.2015.09.001},
  url = {https://doi.org/10.1016/j.dsp.2015.09.001}
} Multipass encoding for reducing pulsing artifacts in cloud based video transcoding
Yao-Chung Lin, Hugh Denman, Anil Kokaram
2015 IEEE International Conference on Image Processing (ICIP)
@inproceedings{Lin2015,
  author = {Yao-Chung Lin and Hugh Denman and Anil Kokaram},
  title = {Multipass encoding for reducing pulsing artifacts in cloud based video transcoding},
  booktitle = {2015 {IEEE} International Conference on Image Processing ({ICIP})},
  year = {2015},
  month = {sep},
  publisher = {{IEEE}},
  doi = {10.1109/icip.2015.7350931},
  url = {https://doi.org/10.1109/icip.2015.7350931}
} Quantifying Difference in Vocalizations of Bird Populations
Colm O'Reilly, Nicola M. Marples, David J. Kelly, Naomi Harte
INTERSPEECH 2015 16th Annual Conference of the International Speech Communication Association, September 6--10, Dresden, Germany , pp. 3417--3421
@inproceedings{O_Reilly2015,
  author = {Colm O'Reilly and Nicola M. Marples and David J. Kelly and Naomi Harte},
  title = {Quantifying Difference in Vocalizations of Bird Populations},
  booktitle = {INTERSPEECH 2015 16th Annual Conference of the International Speech Communication Association, September 6--10, Dresden, Germany},
  year = {2015},
  pages = {3417--3421}
} An Analysis of the Impact of Playout Delay Adjustments introduced by VoIP Jitter Buffers on Listening Speech Quality
Peter Pocta, Hugh Melvin, Andrew Hines
Acta Acustica united with Acustica , vol. 101 , no. 3 , pp. 616--631
@article{Pocta2015,
  author = {Peter Pocta and Hugh Melvin and Andrew Hines},
  title = {An Analysis of the Impact of Playout Delay Adjustments introduced by {VoIP} Jitter Buffers on Listening Speech Quality},
  journal = {Acta Acustica united with Acustica},
  year = {2015},
  month = {may},
  volume = {101},
  number = {3},
  pages = {616--631},
  publisher = {S. Hirzel Verlag},
  doi = {10.3813/aaa.918857},
  url = {https://doi.org/10.3813/aaa.918857}
} Segmentation and Inpainting for Stereoscopic Videos
Félix Raimbault
@phdthesis{Raimbault2015,
  author = {F\'{e}lix Raimbault},
  title = {Segmentation and Inpainting for Stereoscopic Videos},
  school = {Trinity College Dublin},
  year = {2015}
} Enhancement, Summarization and Analysis of Underwater Videos of Nephrops Habitats
Ken Sooknanan
@phdthesis{Sooknanan2015,
  author = {Ken Sooknanan},
  title = {Enhancement, Summarization and Analysis of Underwater Videos of {Nephrops} Habitats},
  school = {Trinity College Dublin},
  year = {2015}
} 2014
Advanced video debanding
Gary Baugh, Anil Kokaram, François Pitié
Proceedings of the 11th European Conference on Visual Media Production
@inproceedings{Baugh2014,
  author = {Gary Baugh and Anil Kokaram and Fran\c{c}ois Piti\'{e}},
  title = {Advanced video debanding},
  booktitle = {Proceedings of the 11th European Conference on Visual Media Production},
  year = {2014},
  month = {nov},
  publisher = {{ACM}},
  doi = {10.1145/2668904.2668912},
  url = {https://doi.org/10.1145/2668904.2668912}
} A Video Database for the Development of Stereo-3D Post-Production Algorithms
David Corrigan, François Pitié, Marcin Gorzel, Gavin Kearney, Valerie Morris et al.
JVRB - Journal of Virtual Reality and Broadcasting 2014
@inproceedings{Corrigan2014,
  author = {David Corrigan and Fran\c{c}ois Piti\'{e} and Marcin Gorzel and Gavin Kearney and Valerie Morris and Andrew Rankin and Mark Linnane and Mick O'Dea and Clive Lee and Anil Kokaram},
  title = {A Video Database for the Development of Stereo-{3D} Post-Production Algorithms},
  booktitle = {JVRB - Journal of Virtual Reality and Broadcasting 2014},
  year = {2014}
} Building a Database of Political Speech
Ailbhe Cullen, Andrew Hines, Naomi Harte
Proceedings of the 4th International Workshop on Audio/Visual Emotion Challenge - AVEC '14
@inproceedings{Cullen2014,
  author = {Ailbhe Cullen and Andrew Hines and Naomi Harte},
  title = {Building a Database of Political Speech},
  booktitle = {Proceedings of the 4th International Workshop on Audio/Visual Emotion Challenge - {AVEC} '14},
  year = {2014},
  publisher = {{ACM} Press},
  doi = {10.1145/2661806.2661808},
  url = {https://doi.org/10.1145/2661806.2661808}
} Investigation of Ambisonic Rendering of Elevated Sound Sources
Marcin Gorzel, Gavin Kearney, Frank Boland
Audio Engineering Society 55th International Conference: Spatial Audio
@inproceedings{Gorzel2014,
  author = {Marcin Gorzel and Gavin Kearney and Frank Boland},
  title = {Investigation of Ambisonic Rendering of Elevated Sound Sources},
  booktitle = {Audio Engineering Society 55th International Conference: Spatial Audio},
  year = {2014},
  month = {aug},
  address = {Helsinki, Finland}
} Perceived Audio Quality for Streaming Stereo Music
Andrew Hines, Eoin Gillen, Damien Kelly, Jan Skoglund, Anil Kokaram et al.
Proceedings of the 22nd ACM international conference on Multimedia
@inproceedings{Hines2014a,
  author = {Andrew Hines and Eoin Gillen and Damien Kelly and Jan Skoglund and Anil Kokaram and Naomi Harte},
  title = {Perceived Audio Quality for Streaming Stereo Music},
  booktitle = {Proceedings of the 22nd {ACM} international conference on Multimedia},
  year = {2014},
  month = {nov},
  publisher = {{ACM}},
  address = {Orlando, FL, USA},
  doi = {10.1145/2647868.2655025},
  url = {https://doi.org/10.1145/2647868.2655025}
} Robustness And Prediction Accuracy Of Machine Learning For Objective Visual Quality Assessment
Andrew Hines, Paul Kendrick, Adriaan Barri, Manish Narwaria, J. A. Redi
EUSIPCO
@inproceedings{Hines2014b,
  author = {Andrew Hines and Paul Kendrick and Adriaan Barri and Manish Narwaria and J. A. Redi},
  title = {Robustness And Prediction Accuracy Of Machine Learning For Objective Visual Quality Assessment},
  booktitle = {{EUSIPCO}},
  year = {2014},
  month = {sep},
  address = {Lisbon, Portugal}
} Automatic Recognition of Ageing Speakers
Finnian Kelly
@phdthesis{Kelly2014a,
  author = {Finnian Kelly},
  title = {Automatic Recognition of Ageing Speakers},
  school = {Trinity College Dublin},
  year = {2014}
} Detecting Arrivals in Room Impulse Responses With Dynamic Time Warping
Ian J. Kelly, Frank Boland
IEEE/ACM Transactions on Audio, Speech, and Language Processing , vol. 22 , no. 7 , pp. 1139--1147
@article{Kelly2014b,
  author    = {Kelly, Ian J. and Boland, Frank},
  title     = {Detecting Arrivals in Room Impulse Responses With Dynamic Time Warping},
  journal   = {IEEE/{ACM} Transactions on Audio, Speech, and Language Processing},
  year      = {2014},
  month     = {jul},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  volume    = {22},
  number    = {7},
  pages     = {1139--1147},
  doi       = {10.1109/taslp.2014.2321472},
  url       = {https://doi.org/10.1109/taslp.2014.2321472}
} Phase and Randomness in Acoustic Responses
Ian J. Kelly, B. O'Toole, F.M. Boland, Marcin Gorzel
25th IET Irish Signals & Systems Conference 2014 and 2014 China-Ireland International Conference on Information and Communities Technologies (ISSC 2014/CIICT 2014)
@inproceedings{Kelly2014c,
  author    = {Kelly, Ian J. and O'Toole, B. and Boland, F. M. and Gorzel, Marcin},
  title     = {Phase and Randomness in Acoustic Responses},
  booktitle = {25th {IET} Irish Signals {\&} Systems Conference 2014 and 2014 China-Ireland International Conference on Information and Communities Technologies ({ISSC} 2014/{CIICT} 2014)},
  year      = {2014},
  publisher = {Institution of Engineering and Technology},
  doi       = {10.1049/cp.2014.0657},
  url       = {https://doi.org/10.1049/cp.2014.0657}
} Randomness and the reverberation time, RTinf, of acoustic responses
Ian J. Kelly, Frank Boland
2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)
@inproceedings{Kelly2014d,
  author    = {Kelly, Ian J. and Boland, Frank},
  title     = {Randomness and the reverberation time, {$\mathrm{RT}_{\mathrm{inf}}$}, of acoustic responses},
  booktitle = {2014 {IEEE} International Conference on Acoustics, Speech and Signal Processing ({ICASSP})},
  year      = {2014},
  month     = {may},
  publisher = {IEEE},
  doi       = {10.1109/icassp.2014.6855204},
  url       = {https://doi.org/10.1109/icassp.2014.6855204}
} Prediction Quality Assessment
Matjaž Kukar
Conformal Prediction for Reliable Machine Learning , pp. 145--166
@incollection{Kukar2014,
  author    = {Kukar, Matja{\v{z}}},
  title     = {Prediction Quality Assessment},
  booktitle = {Conformal Prediction for Reliable Machine Learning},
  year      = {2014},
  publisher = {Elsevier},
  pages     = {145--166},
  doi       = {10.1016/b978-0-12-398537-8.00008-0},
  url       = {https://doi.org/10.1016/b978-0-12-398537-8.00008-0}
} Effect of long-term ageing on i-vector speaker verification
David van Leeuwen, Finnian Kelly, Rahim Saeidi, Naomi Harte
InterSpeech 2014
@inproceedings{Leeuwen2014,
  author    = {van Leeuwen, David and Kelly, Finnian and Saeidi, Rahim and Harte, Naomi},
  title     = {Effect of long-term ageing on i-vector speaker verification},
  booktitle = {InterSpeech 2014},
  year      = {2014},
  month     = {sep},
  address   = {Singapore}
} Virtual 5.1 Surround Sound Localization using Head-Tracking Devices
B.C. O'Toole, L. O'Sullivan, Ian J. Kelly, Frank Boland, Marcin Gorzel et al.
25th IET Irish Signals & Systems Conference 2014 and 2014 China-Ireland International Conference on Information and Communities Technologies (ISSC 2014/CIICT 2014)
@inproceedings{O_Toole2014,
  author    = {O'Toole, B. C. and O'Sullivan, L. and Kelly, Ian J. and Boland, Frank and Gorzel, Marcin and Kearney, Gavin},
  title     = {Virtual 5.1 Surround Sound Localization using Head-Tracking Devices},
  booktitle = {25th {IET} Irish Signals {\&} Systems Conference 2014 and 2014 China-Ireland International Conference on Information and Communities Technologies ({ISSC} 2014/{CIICT} 2014)},
  year      = {2014},
  publisher = {Institution of Engineering and Technology},
  doi       = {10.1049/cp.2014.0656},
  url       = {https://doi.org/10.1049/cp.2014.0656}
} Assessment of Audio/Video synchronisation in streaming media
François Pitié, Damien Kelly, Thierry Foucu, Naomi Harte, Anil Kokaram
2014 Sixth International Workshop on Quality of Multimedia Experience (QoMEX)
@inproceedings{Piti_e2014,
  author    = {Piti{\'{e}}, Fran{\c{c}}ois and Kelly, Damien and Foucu, Thierry and Harte, Naomi and Kokaram, Anil},
  title     = {Assessment of Audio/Video synchronisation in streaming media},
  booktitle = {2014 Sixth International Workshop on Quality of Multimedia Experience ({QoMEX})},
  year      = {2014},
  month     = {sep},
  publisher = {IEEE},
  doi       = {10.1109/qomex.2014.6982315},
  url       = {https://doi.org/10.1109/qomex.2014.6982315}
} Towards Automated Classification of Seabed Substrates in Underwater Video
Matthew Pugh, Bernard Tiddeman, Hannah Dee, Philip Hughes
2014 ICPR Workshop on Computer Vision for Analysis of Underwater Imagery
@inproceedings{Pugh2014,
  author    = {Pugh, Matthew and Tiddeman, Bernard and Dee, Hannah and Hughes, Philip},
  title     = {Towards Automated Classification of Seabed Substrates in Underwater Video},
  booktitle = {2014 {ICPR} Workshop on Computer Vision for Analysis of Underwater Imagery},
  year      = {2014},
  month     = {aug},
  publisher = {IEEE},
  doi       = {10.1109/cvaui.2014.18},
  url       = {https://doi.org/10.1109/cvaui.2014.18}
} Bleed-Through Document Image Restoration
Róisín Rowley-Brooke
@phdthesis{Rowley_Brooke2014,
  author = {Rowley-Brooke, R{\'{o}}is{\'{\i}}n},
  title  = {Bleed-Through Document Image Restoration},
  school = {Trinity College Dublin},
  year   = {2014}
} Mosaics for Nephrops detection in underwater survey videos
Ken Sooknanan, Jennifer Doyle, Colm Lordan, James Wilson, Anil Kokaram et al.
2014 Oceans - St. John's
@inproceedings{Sooknanan2014,
  author    = {Sooknanan, Ken and Doyle, Jennifer and Lordan, Colm and Wilson, James and Kokaram, Anil and Corrigan, David},
  title     = {Mosaics for Nephrops detection in underwater survey videos},
  booktitle = {2014 Oceans - St. John's},
  year      = {2014},
  month     = {sep},
  publisher = {IEEE},
  doi       = {10.1109/oceans.2014.7003142},
  url       = {https://doi.org/10.1109/oceans.2014.7003142}
} Classification of Seabed Type from Underwater Video
Steven Tyner, James Wilson, David Corrigan
Irish Machine Vision and Image Processing Conference (IMVIP)
@inproceedings{Tyner2014,
  author    = {Tyner, Steven and Wilson, James and Corrigan, David},
  title     = {Classification of Seabed Type from Underwater Video},
  booktitle = {Irish Machine Vision and Image Processing Conference (IMVIP)},
  year      = {2014},
  month     = {aug},
  address   = {Derry, Ireland}
} Automated registration of low and high resolution atomic force microscopy images using scale invariant features
Yun-Feng Wang, Jason I. Kilpatrick, Suzanne Jarvis, Frank Boland, Anil Kokaram et al.
2014 IEEE International Conference on Image Processing (ICIP)
@inproceedings{Wang2014,
  author    = {Wang, Yun-Feng and Kilpatrick, Jason I. and Jarvis, Suzanne and Boland, Frank and Kokaram, Anil and Corrigan, David},
  title     = {Automated registration of low and high resolution atomic force microscopy images using scale invariant features},
  booktitle = {2014 {IEEE} International Conference on Image Processing ({ICIP})},
  year      = {2014},
  month     = {oct},
  publisher = {IEEE},
  doi       = {10.1109/icip.2014.7026185},
  url       = {https://doi.org/10.1109/icip.2014.7026185}
} 2013
Exploiting randomness in acoustic impulse responses to achieve headphone compensation through deconvolution
Ian J. Kelly, Frank Boland
The Journal of the Acoustical Society of America , vol. 133 , no. 5 , pp. 2778--2787
@article{Boland2013,
  author  = {Kelly, Ian J. and Boland, Frank},
  title   = {Exploiting randomness in acoustic impulse responses to achieve headphone compensation through deconvolution},
  journal = {The Journal of the Acoustical Society of America},
  year    = {2013},
  volume  = {133},
  number  = {5},
  pages   = {2778--2787},
  doi     = {10.1121/1.4798799}
} Depth perception of audio sources in stereo 3D environments
David Corrigan, Marcin Gorzel, John Squires, Frank Boland
Stereoscopic Displays and Applications XXIV
@inproceedings{Corrigan2013,
  author    = {Corrigan, David and Gorzel, Marcin and Squires, John and Boland, Frank},
  title     = {Depth perception of audio sources in stereo {3D} environments},
  booktitle = {Stereoscopic Displays and Applications {XXIV}},
  editor    = {Woods, Andrew J. and Holliman, Nicolas S. and Favalora, Gregg E.},
  year      = {2013},
  month     = {mar},
  publisher = {SPIE},
  doi       = {10.1117/12.2000713},
  url       = {https://doi.org/10.1117/12.2000713}
} Creaky Voice and the Classification of Affect
Ailbhe Cullen, John Kane, Thomas Drugman, Naomi Harte
Workshop on Affective Social Speech Signals (WASSS)
@inproceedings{Cullen2013a,
  author    = {Cullen, Ailbhe and Kane, John and Drugman, Thomas and Harte, Naomi},
  title     = {Creaky Voice and the Classification of Affect},
  booktitle = {Workshop on Affective Social Speech Signals (WASSS)},
  year      = {2013},
  address   = {Grenoble, France}
} Late Integration of Features for Acoustic Emotion Recognition
Ailbhe Cullen, Naomi Harte
European Signal Processing Conference (EUSIPCO)
@inproceedings{Cullen2013b,
  author    = {Cullen, Ailbhe and Harte, Naomi},
  title     = {Late Integration of Features for Acoustic Emotion Recognition},
  booktitle = {European Signal Processing Conference (EUSIPCO)},
  year      = {2013},
  address   = {Marrakech, Morocco}
} Blotch and scratch removal in archived film using a semi-transparent corruption model and a ground-truth generation technique
Mohamed A Elgharib, François Pitié, Anil Kokaram
Journal on Image and Video Processing , vol. 2013 , no. 1
@article{Elgharib2013a,
  author    = {Elgharib, Mohamed A. and Piti{\'{e}}, Fran{\c{c}}ois and Kokaram, Anil},
  title     = {Blotch and scratch removal in archived film using a semi-transparent corruption model and a ground-truth generation technique},
  journal   = {{EURASIP} Journal on Image and Video Processing},
  year      = {2013},
  month     = {jun},
  publisher = {Springer Science and Business Media {LLC}},
  volume    = {2013},
  number    = {1},
  doi       = {10.1186/1687-5281-2013-33},
  url       = {https://doi.org/10.1186/1687-5281-2013-33}
} User-assisted reflection detection and feature point tracking
Mohamed A. Elgharib, François Pitié, Anil Kokaram and Venkatesh Saligrama
Proceedings of the 10th European Conference on Visual Media Production - CVMP '13
@inproceedings{Elgharib2013b,
  author    = {Elgharib, Mohamed A. and Piti{\'{e}}, Fran{\c{c}}ois and Kokaram, Anil and Saligrama, Venkatesh},
  title     = {User-assisted reflection detection and feature point tracking},
  booktitle = {Proceedings of the 10th European Conference on Visual Media Production - {CVMP} '13},
  year      = {2013},
  publisher = {{ACM} Press},
  doi       = {10.1145/2534008.2534011},
  url       = {https://doi.org/10.1145/2534008.2534011}
} Identifying new bird species from differences in birdsong.
Naomi Harte, Sadhbh Murphy, David J. Kelly, Nicola M. Marples
Interspeech , pp. 2900--2904
@inproceedings{Harte2013,
  author    = {Harte, Naomi and Murphy, Sadhbh and Kelly, David J. and Marples, Nicola M.},
  title     = {Identifying new bird species from differences in birdsong.},
  booktitle = {Interspeech},
  year      = {2013},
  publisher = {ISCA},
  pages     = {2900--2904},
  crossref  = {conf/interspeech/2013},
  ee        = {http://www.isca-speech.org/archive/interspeech\_2013/i13\_2900.html},
  interhash = {f38c673a487bbc70313d08f1fdaeb71f},
  intrahash = {9a761c48439d39a19375c39207159871},
  keywords  = {dblp},
  timestamp = {2014-01-27t00:00:00.000+0100}
} Detailed comparative analysis of PESQ and VISQOL behaviour in the context of playout delay adjustments introduced by VOIP jitter buffer algorithms
Andrew Hines, Peter Pocta, Hugh Melvin
2013 Fifth International Workshop on Quality of Multimedia Experience (QoMEX)
@inproceedings{Hines2013a,
  author    = {Hines, Andrew and Pocta, Peter and Melvin, Hugh},
  title     = {Detailed comparative analysis of {PESQ} and {VISQOL} behaviour in the context of playout delay adjustments introduced by {VOIP} jitter buffer algorithms},
  booktitle = {2013 Fifth International Workshop on Quality of Multimedia Experience ({QoMEX})},
  year      = {2013},
  month     = {jul},
  publisher = {IEEE},
  doi       = {10.1109/qomex.2013.6603195},
  url       = {https://doi.org/10.1109/qomex.2013.6603195}
} Monitoring the Effects of Temporal Clipping on VoIP Speech Quality
Andrew Hines, Jan Skoglund, Anil Kokaram, Naomi Harte
Interspeech 2013
@inproceedings{Hines2013b,
  author    = {Hines, Andrew and Skoglund, Jan and Kokaram, Anil and Harte, Naomi},
  title     = {Monitoring the Effects of Temporal Clipping on {VoIP} Speech Quality},
  booktitle = {Interspeech 2013},
  year      = {2013},
  address   = {Lyon, France}
} Robustness of speech quality metrics to background noise and network degradations: Comparing ViSQOL, PESQ and POLQA
Andrew Hines, Jan Skoglund, Anil Kokaram, Naomi Harte
2013 IEEE International Conference on Acoustics, Speech and Signal Processing
@inproceedings{Hines2013c,
  author    = {Hines, Andrew and Skoglund, Jan and Kokaram, Anil and Harte, Naomi},
  title     = {Robustness of speech quality metrics to background noise and network degradations: Comparing {ViSQOL}, {PESQ} and {POLQA}},
  booktitle = {2013 {IEEE} International Conference on Acoustics, Speech and Signal Processing},
  year      = {2013},
  month     = {may},
  publisher = {IEEE},
  doi       = {10.1109/icassp.2013.6638348},
  url       = {https://doi.org/10.1109/icassp.2013.6638348}
} Auditory detectability of vocal ageing and its effect on forensic automatic speaker recognition
Finnian Kelly, Naomi Harte
InterSpeech 2013
@inproceedings{Kelly2013a,
  author    = {Kelly, Finnian and Harte, Naomi},
  title     = {Auditory detectability of vocal ageing and its effect on forensic automatic speaker recognition},
  booktitle = {InterSpeech 2013},
  year      = {2013},
  address   = {Lyon, France}
} Eigenageing Compensation for Speaker Verification
Finnian Kelly, Niko Brummer, Naomi Harte
InterSpeech 2013
@inproceedings{Kelly2013b,
  author    = {Kelly, Finnian and Brummer, Niko and Harte, Naomi},
  title     = {Eigenageing Compensation for Speaker Verification},
  booktitle = {InterSpeech 2013},
  year      = {2013},
  address   = {Lyon, France}
} Exploiting randomness in acoustic impulse responses to achieve headphone compensation through deconvolution
Ian J. Kelly, Frank Boland
The Journal of the Acoustical Society of America , vol. 133 , no. 5 , pp. 2778--2787
@article{Kelly2013c,
  author    = {Kelly, Ian J. and Boland, Frank},
  title     = {Exploiting randomness in acoustic impulse responses to achieve headphone compensation through deconvolution},
  journal   = {The Journal of the Acoustical Society of America},
  year      = {2013},
  month     = {may},
  publisher = {Acoustical Society of America ({ASA})},
  volume    = {133},
  number    = {5},
  pages     = {2778--2787},
  doi       = {10.1121/1.4798799},
  url       = {https://doi.org/10.1121/1.4798799}
} Speaker verification in score-ageing-quality classification space
Finnian Kelly, Andrzej Drygajlo, Naomi Harte
Computer Speech & Language , vol. 27 , no. 5 , pp. 1068--1084
@article{Kelly2013d,
  author    = {Kelly, Finnian and Drygajlo, Andrzej and Harte, Naomi},
  title     = {Speaker verification in score-ageing-quality classification space},
  journal   = {Computer Speech {\&} Language},
  year      = {2013},
  month     = {aug},
  publisher = {Elsevier {BV}},
  volume    = {27},
  number    = {5},
  pages     = {1068--1084},
  doi       = {10.1016/j.csl.2012.12.005},
  url       = {https://doi.org/10.1016/j.csl.2012.12.005}
} The impact of ageing on speech-based biometric systems
Finnian Kelly, Naomi Harte
Age Factors in Biometric Processing
@incollection{Kelly2013e,
  author    = {Kelly, Finnian and Harte, Naomi},
  title     = {The impact of ageing on speech-based biometric systems},
  booktitle = {Age Factors in Biometric Processing},
  editor    = {Fairhurst, Michael},
  year      = {2013},
  publisher = {IET},
  isbn      = {978-1-84919-502-7}
} Shape Models for Image Segmentation in Microscopy
Kangyu Pan
@phdthesis{Pan2013,
  author = {Pan, Kangyu},
  title  = {Shape Models for Image Segmentation in Microscopy},
  school = {Trinity College Dublin},
  year   = {2013}
} Adaptive video stabilisation with dominant motion layer estimation for home video and TV broadcast
Félix Raimbault, Yalcin Incesu
2013 IEEE International Conference on Image Processing
@inproceedings{Raimbault2013a,
  author    = {Raimbault, F{\'{e}}lix and Incesu, Yalcin},
  title     = {Adaptive video stabilisation with dominant motion layer estimation for home video and {TV} broadcast},
  booktitle = {2013 {IEEE} International Conference on Image Processing},
  year      = {2013},
  month     = {sep},
  publisher = {IEEE},
  doi       = {10.1109/icip.2013.6738788},
  url       = {https://doi.org/10.1109/icip.2013.6738788}
} User-assisted sparse stereo-video segmentation
Félix Raimbault, François Pitié, Anil Kokaram
Proceedings of the 10th European Conference on Visual Media Production - CVMP '13
@inproceedings{Raimbault2013b,
  author    = {Raimbault, F{\'{e}}lix and Piti{\'{e}}, Fran{\c{c}}ois and Kokaram, Anil},
  title     = {User-assisted sparse stereo-video segmentation},
  booktitle = {Proceedings of the 10th European Conference on Visual Media Production - {CVMP} '13},
  year      = {2013},
  publisher = {{ACM} Press},
  doi       = {10.1145/2534008.2534027},
  url       = {https://doi.org/10.1145/2534008.2534027}
} A Non-parametric Framework for Document Bleed-through Removal
Róisín Rowley-Brooke, François Pitié, Anil Kokaram
2013 IEEE Conference on Computer Vision and Pattern Recognition
@inproceedings{Rowley_Brooke2013a,
  author    = {Rowley-Brooke, R{\'{o}}is{\'{\i}}n and Piti{\'{e}}, Fran{\c{c}}ois and Kokaram, Anil},
  title     = {A Non-parametric Framework for Document Bleed-through Removal},
  booktitle = {2013 {IEEE} Conference on Computer Vision and Pattern Recognition},
  year      = {2013},
  month     = {jun},
  publisher = {IEEE},
  doi       = {10.1109/cvpr.2013.380},
  url       = {https://doi.org/10.1109/cvpr.2013.380}
} Degraded manuscript restoration: A case study
Róisín Rowley-Brooke, François Pitié, Anil Kokaram
Annual Conference of the Society for Musicology in Ireland (SMI)
@inproceedings{Rowley_Brooke2013b,
  author    = {Rowley-Brooke, R{\'{o}}is{\'{\i}}n and Piti{\'{e}}, Fran{\c{c}}ois and Kokaram, Anil},
  title     = {Degraded manuscript restoration: {A} case study},
  booktitle = {Annual Conference of the Society for Musicology in Ireland (SMI)},
  year      = {2013},
  address   = {Maynooth, Ireland}
} Nonrigid recto-verso registration using page outline structure and content preserving warps
Róisín Rowley-Brooke, François Pitié, Anil Kokaram
Proceedings of the 2nd International Workshop on Historical Document Imaging and Processing - HIP '13
@inproceedings{Rowley_Brooke2013c,
  author    = {Rowley-Brooke, R{\'{o}}is{\'{\i}}n and Piti{\'{e}}, Fran{\c{c}}ois and Kokaram, Anil},
  title     = {Nonrigid recto-verso registration using page outline structure and content preserving warps},
  booktitle = {Proceedings of the 2nd International Workshop on Historical Document Imaging and Processing - {HIP} '13},
  year      = {2013},
  publisher = {{ACM} Press},
  doi       = {10.1145/2501115.2501124},
  url       = {https://doi.org/10.1145/2501115.2501124}
} Residual Life Prediction of Rotating Machines Using Acoustic Noise Signals
Patricia Scanlon, Darren F. Kavanagh, Frank Boland
IEEE Transactions on Instrumentation and Measurement , vol. 62 , no. 1 , pp. 95--108
@article{Scanlon2013,
  author    = {Scanlon, Patricia and Kavanagh, Darren F. and Boland, Frank},
  title     = {Residual Life Prediction of Rotating Machines Using Acoustic Noise Signals},
  journal   = {IEEE Transactions on Instrumentation and Measurement},
  year      = {2013},
  month     = {jan},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  volume    = {62},
  number    = {1},
  pages     = {95--108},
  doi       = {10.1109/tim.2012.2212508},
  url       = {https://doi.org/10.1109/tim.2012.2212508}
} Mosaics For Burrow Detection in Underwater Surveillance Video
Ken Sooknanan, Jennifer Doyle, James Wilson, Naomi Harte, Anil Kokaram et al.
Oceans 2013
@inproceedings{Sooknanan2013,
  author    = {Sooknanan, Ken and Doyle, Jennifer and Wilson, James and Harte, Naomi and Kokaram, Anil and Corrigan, David},
  title     = {Mosaics For Burrow Detection in Underwater Surveillance Video},
  booktitle = {Oceans 2013},
  year      = {2013},
  address   = {San Diego, USA}
} 2012
Phoneme-to-Viseme Mapping for Visual Speech Recognition
Luca Cappelletta, Naomi Harte
International Conference on Pattern Recognition Applications and Methods (ICPRAM) , vol. 2 , pp. 322--329
@inproceedings{Cappelletta2012,
  author    = {Cappelletta, Luca and Harte, Naomi},
  title     = {Phoneme-to-Viseme Mapping for Visual Speech Recognition},
  booktitle = {International Conference on Pattern Recognition Applications and Methods (ICPRAM)},
  year      = {2012},
  month     = {feb},
  address   = {Vilamoura, Portugal},
  volume    = {2},
  pages     = {322--329}
} Algorithms for the Digital Restoration of Torn Films
David Corrigan, Anil Kokaram, Naomi Harte
IEEE Transactions on Image Processing , vol. 21 , no. 2 , pp. 573--587
@article{Corrigan2012,
  author    = {Corrigan, David and Kokaram, Anil and Harte, Naomi},
  title     = {Algorithms for the Digital Restoration of Torn Films},
  journal   = {IEEE Transactions on Image Processing},
  year      = {2012},
  month     = {feb},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  volume    = {21},
  number    = {2},
  pages     = {573--587},
  doi       = {10.1109/tip.2011.2162425},
  url       = {https://doi.org/10.1109/tip.2011.2162425}
} Lower and upper bounds for approximation of the Kullback-Leibler divergence between Gaussian Mixture Models
J.-L. Durrieu, J.-Ph. Thiran, Finnian Kelly
2012 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)
@inproceedings{Durrieu2012,
  author    = {Durrieu, J.-L. and Thiran, J.-Ph. and Kelly, Finnian},
  title     = {Lower and upper bounds for approximation of the {Kullback-Leibler} divergence between {Gaussian} Mixture Models},
  booktitle = {2012 {IEEE} International Conference on Acoustics, Speech and Signal Processing ({ICASSP})},
  year      = {2012},
  month     = {mar},
  publisher = {IEEE},
  doi       = {10.1109/icassp.2012.6289001},
  url       = {https://doi.org/10.1109/icassp.2012.6289001}
} Distance Perception in Virtual Audio-Visual Environments
Marcin Gorzel, David Corrigan, Gavin Kearney, John Squires and Frank Boland
25th AES UK Conference: Spatial Audio in Today's 3D World
@inproceedings{Gorzel2012,
  author    = {Gorzel, Marcin and Corrigan, David and Kearney, Gavin and Squires, John and Boland, Frank},
  title     = {Distance Perception in Virtual Audio-Visual Environments},
  booktitle = {25th AES UK Conference: Spatial Audio in Today's 3D World},
  year      = {2012},
  month     = {mar},
  address   = {York, United Kingdom}
} Improved Speech Intelligibility with a Chimaera Hearing Aid Algorithm
Andrew Hines, Naomi Harte
InterSpeech 2012
@inproceedings{Hines2012a,
  author    = {Hines, Andrew and Harte, Naomi},
  title     = {Improved Speech Intelligibility with a Chimaera Hearing Aid Algorithm},
  booktitle = {InterSpeech 2012},
  year      = {2012},
  month     = {sep},
  address   = {Portland, Oregon}
} Predicting Speech Intelligibility
Andrew Hines
@phdthesis{Hines2012b,
  author = {Hines, Andrew},
  title  = {Predicting Speech Intelligibility},
  school = {Trinity College Dublin},
  year   = {2012}
} Speech intelligibility prediction using a Neurogram Similarity Index Measure
Andrew Hines, Naomi Harte
Speech Communication , vol. 54 , no. 2 , pp. 306--320
@article{Hines2012c,
  author    = {Hines, Andrew and Harte, Naomi},
  title     = {Speech intelligibility prediction using a Neurogram Similarity Index Measure},
  journal   = {Speech Communication},
  year      = {2012},
  month     = {feb},
  publisher = {Elsevier {BV}},
  volume    = {54},
  number    = {2},
  pages     = {306--320},
  doi       = {10.1016/j.specom.2011.09.004},
  url       = {https://doi.org/10.1016/j.specom.2011.09.004}
} ViSQOL: The Virtual Speech Quality Objective Listener
Andrew Hines, Jan Skoglund, Anil Kokaram, Naomi Harte
International Workshop on Acoustic Signal Enhancement (IWAENC)
@inproceedings{Hines2012d,
  author    = {Hines, Andrew and Skoglund, Jan and Kokaram, Anil and Harte, Naomi},
  title     = {{ViSQOL}: The Virtual Speech Quality Objective Listener},
  booktitle = {International Workshop on Acoustic Signal Enhancement (IWAENC)},
  year      = {2012},
  month     = {sep},
  address   = {Aachen, Germany}
} Distance Perception in Interactive Virtual Acoustic Environments using First and Higher Order Ambisonic Sound Fields
Gavin Kearney, Marcin Gorzel, Henry Rice, Frank Boland
Acta Acustica united with Acustica , vol. 98 , no. 1 , pp. 61--71
@article{Kearney2012a,
  author    = {Kearney, Gavin and Gorzel, Marcin and Rice, Henry and Boland, Frank},
  title     = {Distance Perception in Interactive Virtual Acoustic Environments using First and Higher Order Ambisonic Sound Fields},
  journal   = {Acta Acustica united with Acustica},
  year      = {2012},
  month     = {jan},
  publisher = {S. Hirzel Verlag},
  volume    = {98},
  number    = {1},
  pages     = {61--71},
  doi       = {10.3813/aaa.918492},
  url       = {https://doi.org/10.3813/aaa.918492}
} On loudspeaker rendering of auditory distance in higher order Ambisonics
Gavin Kearney, Marcin Gorzel, Frank Boland
Acoustics 2012
@inproceedings{Kearney2012b,
  author       = {Kearney, Gavin and Gorzel, Marcin and Boland, Frank},
  title        = {On loudspeaker rendering of auditory distance in higher order Ambisonics},
  booktitle    = {Acoustics 2012},
  year         = {2012},
  month        = {apr},
  address      = {Nantes, France},
  organization = {EAA}
} On Phase and Randomness in Head Related Impulse Responses
Ian J. Kelly, Frank Boland
9th IMA International Conference on Mathematics in Signal Processing
@inproceedings{Kelly2012a,
  author    = {Kelly, Ian J. and Boland, Frank},
  title     = {On Phase and Randomness in Head Related Impulse Responses},
  booktitle = {9th IMA International Conference on Mathematics in Signal Processing},
  year      = {2012},
  month     = {dec},
  address   = {Birmingham, UK}
} Speaker verification with long-term ageing data
Finnian Kelly, Andrzej Drygajlo, Naomi Harte
2012 5th IAPR International Conference on Biometrics (ICB)
@inproceedings{Kelly2012b,
  author    = {Kelly, Finnian and Drygajlo, Andrzej and Harte, Naomi},
  title     = {Speaker verification with long-term ageing data},
  booktitle = {2012 5th {IAPR} International Conference on Biometrics ({ICB})},
  year      = {2012},
  month     = {mar},
  publisher = {IEEE},
  doi       = {10.1109/icb.2012.6199796},
  url       = {https://doi.org/10.1109/icb.2012.6199796}
} HRIR Order Reduction Using Approximate Factorization
Claire Masterson, Gavin Kearney, Marcin Gorzel, Frank Boland
IEEE Transactions on Audio, Speech, and Language Processing , vol. 20 , no. 6 , pp. 1808--1817
@article{Masterson2012,
  author    = {Masterson, Claire and Kearney, Gavin and Gorzel, Marcin and Boland, Frank},
  title     = {{HRIR} Order Reduction Using Approximate Factorization},
  journal   = {IEEE Transactions on Audio, Speech, and Language Processing},
  year      = {2012},
  month     = {aug},
  publisher = {Institute of Electrical and Electronics Engineers ({IEEE})},
  volume    = {20},
  number    = {6},
  pages     = {1808--1817},
  doi       = {10.1109/tasl.2012.2189565},
  url       = {https://doi.org/10.1109/tasl.2012.2189565}
} A wavelet-based Bayesian framework for 3D object segmentation in microscopy
Kangyu Pan, David Corrigan, Jens Hillebrand, Mani Ramaswami and Anil Kokaram
Three-Dimensional and Multidimensional Microscopy: Image Acquisition and Processing XIX
@inproceedings{Pan2012,
  author    = {Pan, Kangyu and Corrigan, David and Hillebrand, Jens and Ramaswami, Mani and Kokaram, Anil},
  title     = {A wavelet-based {Bayesian} framework for {3D} object segmentation in microscopy},
  booktitle = {Three-Dimensional and Multidimensional Microscopy: Image Acquisition and Processing {XIX}},
  editor    = {Conchello, Jose-Angel and Cogswell, Carol J. and Wilson, Tony and Brown, Thomas G.},
  year      = {2012},
  month     = {feb},
  publisher = {SPIE},
  doi       = {10.1117/12.908916},
  url       = {https://doi.org/10.1117/12.908916}
} Stereo video completion for rig and artefact removal
Félix Raimbault, François Pitié, Anil Kokaram
2012 13th International Workshop on Image Analysis for Multimedia Interactive Services
@inproceedings{Raimbault2012a,
  author    = {Raimbault, F{\'{e}}lix and Piti{\'{e}}, Fran{\c{c}}ois and Kokaram, Anil},
  title     = {Stereo video completion for rig and artefact removal},
  booktitle = {2012 13th International Workshop on Image Analysis for Multimedia Interactive Services},
  year      = {2012},
  month     = {may},
  publisher = {IEEE},
  doi       = {10.1109/wiamis.2012.6226762},
  url       = {https://doi.org/10.1109/wiamis.2012.6226762}
}
@article{Raimbault2012b,
  author    = {Raimbault, F{\'{e}}lix},
  title     = {Stereo-video inpainting},
  journal   = {Journal of Electronic Imaging},
  year      = {2012},
  month     = {feb},
  publisher = {{SPIE}-Intl Soc Optical Eng},
  volume    = {21},
  number    = {1},
  pages     = {011005},
  doi       = {10.1117/1.jei.21.1.011005},
  url       = {https://doi.org/10.1117/1.jei.21.1.011005}
} A Ground Truth Bleed-Through Document Image Database
Róisín Rowley-Brooke, François Pitié, Anil Kokaram
Theory and Practice of Digital Libraries , pp. 185--196
@incollection{Rowley_Brooke2012a,
  author    = {Rowley-Brooke, R{\'{o}}is{\'{\i}}n and Piti{\'{e}}, Fran{\c{c}}ois and Kokaram, Anil},
  title     = {A Ground Truth Bleed-Through Document Image Database},
  booktitle = {Theory and Practice of Digital Libraries},
  year      = {2012},
  publisher = {Springer Berlin Heidelberg},
  pages     = {185--196},
  doi       = {10.1007/978-3-642-33290-6_21},
  url       = {https://doi.org/10.1007/978-3-642-33290-6_21}
} Bleed-through removal in degraded documents
Róisín Rowley-Brooke, Anil Kokaram
Document Recognition and Retrieval XIX
@inproceedings{Rowley_Brooke2012b,
  author    = {Rowley-Brooke, R{\'{o}}is{\'{\i}}n and Kokaram, Anil},
  title     = {Bleed-through removal in degraded documents},
  booktitle = {Document Recognition and Retrieval {XIX}},
  editor    = {Viard-Gaudin, Christian and Zanibbi, Richard},
  year      = {2012},
  month     = {jan},
  publisher = {SPIE},
  doi       = {10.1117/12.908911},
  url       = {https://doi.org/10.1117/12.908911}
} Improving underwater visibility using vignetting correction
Ken Sooknanan, Anil Kokaram, David Corrigan, Gary Baugh, James Wilson et al.
Visual Information Processing and Communication III
@inproceedings{Sooknanan2012a,
  author    = {Sooknanan, Ken and Kokaram, Anil and Corrigan, David and Baugh, Gary and Wilson, James and Harte, Naomi},
  title     = {Improving underwater visibility using vignetting correction},
  booktitle = {Visual Information Processing and Communication {III}},
  editor    = {Said, Amir and Guleryuz, Onur G. and Stevenson, Robert L.},
  year      = {2012},
  month     = {feb},
  publisher = {SPIE},
  doi       = {10.1117/12.909134},
  url       = {https://doi.org/10.1117/12.909134}
} Indexing and selection of well-lit details in underwater video mosaics using vignetting estimation
Ken Sooknanan, Anil Kokaram, David Corrigan, Gary Baugh, Naomi Harte et al.
2012 Oceans - Yeosu
@inproceedings{Sooknanan2012b,
  author    = {Sooknanan, Ken and Kokaram, Anil and Corrigan, David and Baugh, Gary and Harte, Naomi and Wilson, James},
  title     = {Indexing and selection of well-lit details in underwater video mosaics using vignetting estimation},
  booktitle = {2012 Oceans - Yeosu},
  year      = {2012},
  month     = {may},
  publisher = {IEEE},
  doi       = {10.1109/oceans-yeosu.2012.6263541},
  url       = {https://doi.org/10.1109/oceans-yeosu.2012.6263541}
} Restoration of high-resolution AFM images captured with broken probes
Y. F. Wang, David Corrigan, C. Forman, Suzanne Jarvis, Anil Kokaram
Three-Dimensional and Multidimensional Microscopy: Image Acquisition and Processing XIX
@inproceedings{Wang2012,
  author    = {Wang, Y. F. and Corrigan, David and Forman, C. and Jarvis, Suzanne and Kokaram, Anil},
  title     = {Restoration of high-resolution {AFM} images captured with broken probes},
  booktitle = {Three-Dimensional and Multidimensional Microscopy: Image Acquisition and Processing {XIX}},
  editor    = {Conchello, Jose-Angel and Cogswell, Carol J. and Wilson, Tony and Brown, Thomas G.},
  year      = {2012},
  month     = {feb},
  publisher = {SPIE},
  doi       = {10.1117/12.906752},
  url       = {https://doi.org/10.1117/12.906752}
} 2011
Motion Estimation for Regions of Reflections through Layer Separation
Mohamed Abdelaziz Ahmed, François Pitié, Anil Kokaram
2011 Conference for Visual Media Production
@inproceedings{Ahmed2011a,
  author    = {Ahmed, Mohamed Abdelaziz and Piti{\'{e}}, Fran{\c{c}}ois and Kokaram, Anil},
  title     = {Motion Estimation for Regions of Reflections through Layer Separation},
  booktitle = {2011 Conference for Visual Media Production},
  year      = {2011},
  month     = {nov},
  publisher = {IEEE},
  doi       = {10.1109/cvmp.2011.12},
  url       = {https://doi.org/10.1109/cvmp.2011.12}
} Reflection detection in image sequences
Mohamed Abdelaziz Ahmed, François Pitié, Anil Kokaram
CVPR 2011
@inproceedings{Ahmed2011b,
  author    = {Ahmed, Mohamed Abdelaziz and Piti{\'{e}}, Fran{\c{c}}ois and Kokaram, Anil},
  title     = {Reflection detection in image sequences},
  booktitle = {{CVPR} 2011},
  year      = {2011},
  month     = {jun},
  publisher = {IEEE},
  doi       = {10.1109/cvpr.2011.5995670},
  url       = {https://doi.org/10.1109/cvpr.2011.5995670}
} An Extended Multiresolution Approach to Mouth Specific AAM Fitting for Speech Recognition
Craig Berry, Anil Kokaram, Naomi Harte
European Signal Processing Conference (EUSIPCO)
@inproceedings{Berry2011,
  author    = {Berry, Craig and Kokaram, Anil and Harte, Naomi},
  title     = {An Extended Multiresolution Approach to Mouth Specific {AAM} Fitting for Speech Recognition},
  booktitle = {European Signal Processing Conference ({EUSIPCO})},
  year      = {2011},
  month     = {sep},
  address   = {Barcelona, Spain}
} Viseme Definitions Comparison for Visual-Only Speech Recognition
Luca Cappelletta, Naomi Harte
European Signal Processing Conference (EUSIPCO)
@inproceedings{Cappelletta2011,
  author    = {Cappelletta, Luca and Harte, Naomi},
  title     = {Viseme Definitions Comparison for Visual-Only Speech Recognition},
  booktitle = {European Signal Processing Conference ({EUSIPCO})},
  year      = {2011},
  month     = {sep},
  address   = {Barcelona, Spain}
} Restoration of Image Burnout in 3D-Stereoscopic Media Using Inter-View Gradient Interpolation
David Corrigan, François Pitié, Anil Kokaram
European Signal Processing Conference (EUSIPCO)
@inproceedings{Corrigan2011a,
  author    = {Corrigan, David and Piti\'{e}, Fran\c{c}ois and Kokaram, Anil},
  title     = {Restoration of Image Burnout in {3D}-Stereoscopic Media Using Inter-View Gradient Interpolation},
  booktitle = {European Signal Processing Conference ({EUSIPCO})},
  year      = {2011},
  month     = {sep},
  address   = {Barcelona, Spain}
} Restoring Image Burnout in 3D-Stereoscopic Media using Temporally Consistent Disparity Maps
David Corrigan, François Pitié, Anil Kokaram
Irish Signals and Systems Conference
@inproceedings{Corrigan2011b,
  author    = {Corrigan, David and Piti\'{e}, Fran\c{c}ois and Kokaram, Anil},
  title     = {Restoring Image Burnout in {3D}-Stereoscopic Media using Temporally Consistent Disparity Maps},
  booktitle = {Irish Signals and Systems Conference},
  year      = {2011},
  month     = {jun},
  address   = {Dublin, Ireland}
} Handling Transparency in Digital Video
Mohamed A. Elgharib
@phdthesis{Elgharib2011,
  author = {Elgharib, Mohamed A.},
  title  = {Handling Transparency in Digital Video},
  school = {Trinity College Dublin},
  year   = {2011}
} On the Perception of Dynamic Sound Sources in Ambisonic Binaural Renderings
Marcin Gorzel, Gavin Kearney, Henry Rice, Frank Boland
AES 41st International Conference
@inproceedings{Gorzel2011,
  author       = {Gorzel, Marcin and Kearney, Gavin and Rice, Henry and Boland, Frank},
  title        = {On the Perception of Dynamic Sound Sources in Ambisonic Binaural Renderings},
  booktitle    = {{AES} 41st International Conference},
  year         = {2011},
  month        = {feb},
  address      = {London, UK},
  organization = {{AES}}
} Comparing hearing aid algorithm performance using Simulated Performance Intensity Functions
Andrew Hines, Naomi Harte
Speech perception and auditory disorders, Int. Symposium on Audiological and Auditory Research (ISAAR)
@inproceedings{Hines2011a,
  author    = {Hines, Andrew and Harte, Naomi},
  title     = {Comparing hearing aid algorithm performance using Simulated Performance Intensity Functions},
  booktitle = {Speech perception and auditory disorders, Int. Symposium on Audiological and Auditory Research ({ISAAR})},
  year      = {2011},
  month     = {aug},
  address   = {Nyborg, Denmark}
} Reproduction of the performance/intensity function using image processing and a computational model (A)
Andrew Hines, Naomi Harte
International Journal of Audiology , vol. 50 , no. 10 , pp. 723
@article{Hines2011b,
  author  = {Hines, Andrew and Harte, Naomi},
  title   = {Reproduction of the performance/intensity function using image processing and a computational model ({A})},
  journal = {International Journal of Audiology},
  year    = {2011},
  volume  = {50},
  number  = {10},
  pages   = {723},
  doi     = {10.3109/14992027.2011.588967},
  url     = {https://doi.org/10.3109/14992027.2011.588967}
} Simulated performance intensity functions
Andrew Hines, Naomi Harte
2011 Annual International Conference of the IEEE Engineering in Medicine and Biology Society
@inproceedings{Hines2011c,
  author    = {Hines, Andrew and Harte, Naomi},
  title     = {Simulated performance intensity functions},
  booktitle = {2011 Annual International Conference of the {IEEE} Engineering in Medicine and Biology Society},
  year      = {2011},
  month     = {aug},
  publisher = {{IEEE}},
  doi       = {10.1109/iembs.2011.6091804},
  url       = {https://doi.org/10.1109/iembs.2011.6091804}
} Real-time walkthrough auralisation of the acoustics of Christ Church cathedral Dublin
Gavin Kearney, Marcin Gorzel, Frank Boland, F. Smyth, D. Lennon et al.
Proc of the Institute of Acoustics , vol. 33 , pp. 244--258
@inproceedings{Kearney2011,
  author       = {Kearney, Gavin and Gorzel, Marcin and Boland, Frank and Smyth, F. and Lennon, D. and Rice, Henry},
  title        = {Real-time walkthrough auralisation of the acoustics of {Christ Church} cathedral {Dublin}},
  booktitle    = {Proceedings of the Institute of Acoustics},
  year         = {2011},
  address      = {UK},
  volume       = {33},
  pages        = {244--258},
  organization = {{IOA}}
} Effects of Long-Term Ageing on Speaker Verification
Finnian Kelly, Naomi Harte
Lecture Notes in Computer Science , pp. 113--124
@incollection{Kelly2011,
  author    = {Kelly, Finnian and Harte, Naomi},
  title     = {Effects of Long-Term Ageing on Speaker Verification},
  booktitle = {Biometrics and {ID} Management},
  series    = {Lecture Notes in Computer Science},
  volume    = {6583},
  year      = {2011},
  publisher = {Springer Berlin Heidelberg},
  pages     = {113--124},
  doi       = {10.1007/978-3-642-19530-3_11},
  url       = {https://doi.org/10.1007/978-3-642-19530-3_11}
} Cellsnake: A new active contour technique for cell/fibre segmentation
Kangyu Pan, Anil Kokaram, Kerry Gilmore, Michael J. Higgins, Robert Kapsa, Gordon G. Wallace
2011 18th IEEE International Conference on Image Processing
@inproceedings{Pan2011,
  author    = {Pan, Kangyu and Kokaram, Anil and Gilmore, Kerry and Higgins, Michael J. and Kapsa, Robert and Wallace, Gordon G.},
  title     = {Cellsnake: A new active contour technique for cell/fibre segmentation},
  booktitle = {2011 18th {IEEE} International Conference on Image Processing},
  year      = {2011},
  month     = {sep},
  publisher = {{IEEE}},
  doi       = {10.1109/icip.2011.6116037},
  url       = {https://doi.org/10.1109/icip.2011.6116037}
} Stereo video inpainting
Félix Raimbault, Anil Kokaram
Stereoscopic Displays and Applications XXII
@inproceedings{Raimbault2011,
  author    = {Raimbault, F\'{e}lix and Kokaram, Anil},
  title     = {Stereo video inpainting},
  booktitle = {Stereoscopic Displays and Applications {XXII}},
  editor    = {Woods, Andrew J. and Holliman, Nicolas S. and Dodgson, Neil A.},
  year      = {2011},
  month     = {feb},
  publisher = {{SPIE}},
  doi       = {10.1117/12.872465},
  url       = {https://doi.org/10.1117/12.872465}
} Bleed-Through Removal in Degraded Manuscripts
Róisín Rowley-Brooke, Anil Kokaram
Irish Signals and Systems Conference
@inproceedings{Rowley_Brooke2011a,
  author    = {Rowley-Brooke, R\'{o}is\'{\i}n and Kokaram, Anil},
  title     = {Bleed-Through Removal in Degraded Manuscripts},
  booktitle = {Irish Signals and Systems Conference},
  address   = {Trinity College, Dublin, Ireland},
  year      = {2011}
} Degraded Document Bleed-Through Removal
Róisín Rowley-Brooke, Anil Kokaram
2011 Irish Machine Vision and Image Processing Conference
@inproceedings{Rowley_Brooke2011b,
  author    = {Rowley-Brooke, R\'{o}is\'{\i}n and Kokaram, Anil},
  title     = {Degraded Document Bleed-Through Removal},
  booktitle = {2011 Irish Machine Vision and Image Processing Conference},
  year      = {2011},
  month     = {sep},
  publisher = {{IEEE}},
  doi       = {10.1109/imvip.2011.21},
  url       = {https://doi.org/10.1109/imvip.2011.21}
} 2010
Semi-automatic motion based segmentation using long term motion trajectories
Gary Baugh, Anil Kokaram
2010 IEEE International Conference on Image Processing
@inproceedings{Baugh2010,
  author    = {Baugh, Gary and Kokaram, Anil},
  title     = {Semi-automatic motion based segmentation using long term motion trajectories},
  booktitle = {2010 {IEEE} International Conference on Image Processing},
  year      = {2010},
  month     = {sep},
  publisher = {{IEEE}},
  doi       = {10.1109/icip.2010.5653946},
  url       = {https://doi.org/10.1109/icip.2010.5653946}
} Nostril detection for robust mouth tracking
Luca Cappelletta, Naomi Harte
IET Irish Signals and Systems Conference (ISSC 2010)
@inproceedings{Cappelletta2010,
  author    = {Cappelletta, Luca and Harte, Naomi},
  title     = {Nostril detection for robust mouth tracking},
  booktitle = {{IET} Irish Signals and Systems Conference ({ISSC} 2010)},
  year      = {2010},
  publisher = {{IET}},
  doi       = {10.1049/cp.2010.0519},
  url       = {https://doi.org/10.1049/cp.2010.0519}
} A Video Database for the Development of Stereo-3D Post-Production Algorithms
David Corrigan, François Pitié, Valerie Morris, Andrew Rankin, M. Linnane et al.
2010 Conference on Visual Media Production
@inproceedings{Corrigan2010,
  author    = {Corrigan, David and Piti\'{e}, Fran\c{c}ois and Morris, Valerie and Rankin, Andrew and Linnane, M. and Kearney, Gavin and Gorzel, Marcin and O'Dea, M. and Lee, C. and Kokaram, Anil},
  title     = {A Video Database for the Development of Stereo-{3D} Post-Production Algorithms},
  booktitle = {2010 Conference on Visual Media Production},
  year      = {2010},
  month     = {nov},
  publisher = {{IEEE}},
  doi       = {10.1109/cvmp.2010.16},
  url       = {https://doi.org/10.1109/cvmp.2010.16}
} Evaluating Sensorineural Hearing Loss With An Auditory Nerve Model Using: A Mean Structural Similarity Measure
Andrew Hines, Naomi Harte
European Signal Processing Conference (EUSIPCO '10)
@inproceedings{Hines2010a,
  author    = {Hines, Andrew and Harte, Naomi},
  title     = {Evaluating Sensorineural Hearing Loss With An Auditory Nerve Model Using: A Mean Structural Similarity Measure},
  booktitle = {European Signal Processing Conference ({EUSIPCO} '10)},
  year      = {2010},
  month     = {aug},
  address   = {Aalborg, Denmark}
} Speech intelligibility from image processing
Andrew Hines, Naomi Harte
Speech Communication , vol. 52 , no. 9 , pp. 736--752
@article{Hines2010b,
  author    = {Hines, Andrew and Harte, Naomi},
  title     = {Speech intelligibility from image processing},
  journal   = {Speech Communication},
  volume    = {52},
  number    = {9},
  pages     = {736--752},
  year      = {2010},
  month     = {sep},
  publisher = {Elsevier {BV}},
  doi       = {10.1016/j.specom.2010.04.006},
  url       = {https://doi.org/10.1016/j.specom.2010.04.006}
} Depth perception in interactive virtual acoustic environments using higher order ambisonic soundfields
Gavin Kearney, Marcin Gorzel, H. Rice, Frank Boland
2nd International Ambisonics and Spherical Acoustics Symposium
@inproceedings{Kearney2010,
  author    = {Kearney, Gavin and Gorzel, Marcin and Rice, H. and Boland, Frank},
  title     = {Depth perception in interactive virtual acoustic environments using higher order ambisonic soundfields},
  booktitle = {2nd International Ambisonics and Spherical Acoustics Symposium},
  year      = {2010},
  month     = {may},
  address   = {Paris, France}
} A Comparison of Auditory Features for Robust Speech Recognition
Finnian Kelly, Naomi Harte
European Signal Processing Conference (EUSIPCO '10)
@inproceedings{Kelly2010a,
  author    = {Kelly, Finnian and Harte, Naomi},
  title     = {A Comparison of Auditory Features for Robust Speech Recognition},
  booktitle = {European Signal Processing Conference (EUSIPCO '10)},
  address   = {Aalborg, Denmark},
  month     = {aug},
  year      = {2010}
} Auditory Features Revisited for Robust Speech Recognition
Finnian Kelly, Naomi Harte
2010 20th International Conference on Pattern Recognition
@inproceedings{Kelly2010b,
  author    = {Kelly, Finnian and Harte, Naomi},
  title     = {Auditory Features Revisited for Robust Speech Recognition},
  booktitle = {2010 20th International Conference on Pattern Recognition},
  year      = {2010},
  month     = {aug},
  publisher = {{IEEE}},
  doi       = {10.1109/icpr.2010.1082},
  url       = {https://doi.org/10.1109/icpr.2010.1082}
} Training GMMs for speaker verification
Finnian Kelly, Naomi Harte
IET Irish Signals and Systems Conference (ISSC 2010)
@inproceedings{Kelly2010c,
  author    = {Kelly, Finnian and Harte, Naomi},
  title     = {Training {GMMs} for speaker verification},
  booktitle = {{IET} Irish Signals and Systems Conference ({ISSC} 2010)},
  year      = {2010},
  publisher = {{IET}},
  doi       = {10.1049/cp.2010.0506},
  url       = {https://doi.org/10.1049/cp.2010.0506}
} HRIR Factorisation: A Regularised Approach
C. Masterson, Gavin Kearney, Frank Boland
EUSIPCO 2010 , vol. 2 , pp. 751--755
@inproceedings{Masterson2010a,
  author       = {Masterson, C. and Kearney, Gavin and Boland, Frank},
  title        = {{HRIR} Factorisation: {A} Regularised Approach},
  booktitle    = {{EUSIPCO} 2010},
  year         = {2010},
  month        = {aug},
  address      = {Aalborg, Denmark},
  volume       = {2},
  pages        = {751--755},
  organization = {{EURASIP}}
} Optimised virtual loudspeaker reproduction
C. Masterson, Gavin Kearney, Marcin Gorzel, H. Rice, Frank Boland
IET Irish Signals and Systems Conference (ISSC 2010)
@inproceedings{Masterson2010b,
  author    = {Masterson, C. and Kearney, Gavin and Gorzel, Marcin and Rice, H. and Boland, Frank},
  title     = {Optimised virtual loudspeaker reproduction},
  booktitle = {{IET} Irish Signals and Systems Conference ({ISSC} 2010)},
  year      = {2010},
  publisher = {{IET}},
  doi       = {10.1049/cp.2010.0493},
  url       = {https://doi.org/10.1049/cp.2010.0493}
} Content-Based Media Processing
Deirdre O'Regan
@phdthesis{O_Regan2010,
  author = {O'Regan, Deirdre},
  title  = {Content-Based Media Processing},
  school = {Trinity College Dublin},
  year   = {2010}
} Gaussian mixture models for spots in microscopy using a new split/merge em algorithm
Kangyu Pan, Anil Kokaram, Jens Hillebrand, Mani Ramaswami
2010 IEEE International Conference on Image Processing
@inproceedings{Pan2010a,
  author    = {Pan, Kangyu and Kokaram, Anil and Hillebrand, Jens and Ramaswami, Mani},
  title     = {Gaussian mixture models for spots in microscopy using a new split/merge {EM} algorithm},
  booktitle = {2010 {IEEE} International Conference on Image Processing},
  year      = {2010},
  month     = {sep},
  publisher = {{IEEE}},
  doi       = {10.1109/icip.2010.5652472},
  url       = {https://doi.org/10.1109/icip.2010.5652472}
} Gaussian Mixtures for Intensity Modeling of Spots in Microscopy
Kangyu Pan, Jens Hillebrand, Mani Ramaswami, Anil Kokaram
International Symposium on Biomedical Imaging (ISBI'10) , pp. 121--124
@inproceedings{Pan2010b,
  author    = {Pan, Kangyu and Hillebrand, Jens and Ramaswami, Mani and Kokaram, Anil},
  title     = {Gaussian Mixtures for Intensity Modeling of Spots in Microscopy},
  booktitle = {International Symposium on Biomedical Imaging ({ISBI}'10)},
  year      = {2010},
  month     = {feb},
  publisher = {{IEEE}},
  address   = {Rotterdam, Netherlands},
  pages     = {121--124},
  doi       = {10.1109/isbi.2010.5490398},
  url       = {https://doi.org/10.1109/isbi.2010.5490398}
} Matting with a depth map
François Pitié, Anil Kokaram
2010 IEEE International Conference on Image Processing
@inproceedings{Piti_e2010,
  author    = {Piti\'{e}, Fran\c{c}ois and Kokaram, Anil},
  title     = {Matting with a depth map},
  booktitle = {2010 {IEEE} International Conference on Image Processing},
  year      = {2010},
  month     = {sep},
  publisher = {{IEEE}},
  doi       = {10.1109/icip.2010.5653548},
  url       = {https://doi.org/10.1109/icip.2010.5653548}
} 2008
@incollection{Piti_e2008,
  author    = {Piti\'{e}, Fran\c{c}ois and Kokaram, Anil and Dahyot, Rozenn},
  title     = {Enhancement of Digital Photographs Using Color Transfer Techniques},
  booktitle = {Single-Sensor Imaging: Methods and Applications for Digital Cameras},
  editor    = {Lukac, Rastislav},
  year      = {2008},
  month     = {sep},
  day       = {9},
  publisher = {CRC Press},
  series    = {Image Processing Series},
  pages     = {295--321},
  doi       = {10.1201/9781420054538.ch11},
  isbn      = {978-1-4200-5452-1},
  url       = {https://doi.org/10.1201/9781420054538.ch11},
  demo      = {https://github.com/frcs/colour-transfer}
} No publications found matching your search.