2023
Artículos de revista
Mingote, Victoria; Gimeno, Pablo; Vicente, Luis; Khurana, Sameer; Laurent, Antoine; Duret, Jarod
Direct Text to Speech Translation System Using Acoustic Units Artículo de revista
En: IEEE Signal Processing Letters, vol. 30, pp. 1262-1266, 2023.
@article{Mingote2023Units,
  author    = {Victoria Mingote and Pablo Gimeno and Luis Vicente and Sameer Khurana and Antoine Laurent and Jarod Duret},
  title     = {Direct Text to Speech Translation System Using Acoustic Units},
  journal   = {IEEE Signal Processing Letters},
  volume    = {30},
  pages     = {1262--1266},
  year      = {2023},
  date      = {2023-09-14},
  doi       = {10.1109/LSP.2023.3313513},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Mingote, Victoria; Miguel, Antonio; Ortega, Alfonso; Lleida, Eduardo
Class token and knowledge distillation for multi-head self-attention speaker verification systems Artículo de revista
En: Digital Signal Processing, vol. 133, pp. 103859, 2023.
@article{nokey,
  author    = {Victoria Mingote and Antonio Miguel and Alfonso Ortega and Eduardo Lleida},
  title     = {Class token and knowledge distillation for multi-head self-attention speaker verification systems},
  journal   = {Digital Signal Processing},
  volume    = {133},
  pages     = {103859},
  year      = {2023},
  date      = {2023-03-01},
  urldate   = {2022-12-01},
  doi       = {10.1016/j.dsp.2022.103859},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Ribas, Dayana; Pastor, Miguel; Miguel, Antonio; Martínez, David; Ortega, Alfonso; Lleida, Eduardo
Automatic Voice Disorder Detection using Self-Supervised Representations Artículo de revista
En: IEEE Access, vol. 11, pp. 14915-14927, 2023.
@article{Ribas2023,
  author    = {Dayana Ribas and Miguel Pastor and Antonio Miguel and David Martínez and Alfonso Ortega and Eduardo Lleida},
  title     = {Automatic Voice Disorder Detection using Self-Supervised Representations},
  journal   = {IEEE Access},
  volume    = {11},
  pages     = {14915--14927},
  year      = {2023},
  date      = {2023-02-10},
  urldate   = {2023-02-10},
  doi       = {10.1109/ACCESS.2023.3243986},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Conferencias
Ribas, Dayana; Miguel, Antonio; Ortega, Alfonso; Lleida, Eduardo
On the Problem of Data Availability in Automatic Voice Disorder Detection Conferencia
Proceedings of the 16th International Joint Conference on Biomedical Engineering Systems and Technologies (BIOSTEC 2023) – Volume 5: HEALTHINF, 2023, ISBN: 978-989-758-631-6.
@conference{Ribas2023b,
  author    = {Dayana Ribas and Antonio Miguel and Alfonso Ortega and Eduardo Lleida},
  title     = {On the Problem of Data Availability in Automatic Voice Disorder Detection},
  booktitle = {Proceedings of the 16th International Joint Conference on Biomedical Engineering Systems and Technologies (BIOSTEC 2023) - Volume 5: HEALTHINF},
  pages     = {330--337},
  year      = {2023},
  date      = {2023-02-13},
  urldate   = {2023-02-13},
  isbn      = {978-989-758-631-6},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
2022
Artículos de revista
Ribas, Dayana; Miguel, Antonio; Ortega, Alfonso; Lleida, Eduardo
Wiener Filter and Deep Neural Networks: A Well-Balanced Pair for Speech Enhancement Artículo de revista
En: Applied Sciences, vol. 12, no 18, pp. 9000, 2022.
@article{Ribas2022,
  author    = {Dayana Ribas and Antonio Miguel and Alfonso Ortega and Eduardo Lleida},
  title     = {{Wiener} Filter and Deep Neural Networks: A Well-Balanced Pair for Speech Enhancement},
  journal   = {Applied Sciences},
  volume    = {12},
  number    = {18},
  pages     = {9000},
  year      = {2022},
  date      = {2022-09-07},
  doi       = {10.3390/app12189000},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Almudévar, Antonio; Sevillano, Pascual; Vicente, Luis; Preciado-Garbayo, Javier; Ortega, Alfonso
Unsupervised Anomaly Detection Applied to Φ-OTDR Artículo de revista
En: Sensors, vol. 22, no 17, pp. 6515, 2022.
@article{Almudevar2022,
  author    = {Antonio Almudévar and Pascual Sevillano and Luis Vicente and Javier Preciado-Garbayo and Alfonso Ortega},
  title     = {Unsupervised Anomaly Detection Applied to {Φ-OTDR}},
  journal   = {Sensors},
  volume    = {22},
  number    = {17},
  pages     = {6515},
  year      = {2022},
  date      = {2022-08-29},
  urldate   = {2022-08-29},
  doi       = {10.3390/s22176515},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Prieto, Santi; Ortega, Alfonso; López-Espejo, Iván; Lleida, Eduardo
Shouted and whispered speech compensation for speaker verification systems Artículo de revista
En: Digital Signal Processing, vol. 127, pp. 103536, 2022.
@article{Prieto2022,
  author    = {Santi Prieto and Alfonso Ortega and Iván López-Espejo and Eduardo Lleida},
  title     = {Shouted and whispered speech compensation for speaker verification systems},
  journal   = {Digital Signal Processing},
  volume    = {127},
  pages     = {103536},
  year      = {2022},
  date      = {2022-07-01},
  doi       = {10.1016/j.dsp.2022.103536},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Gimeno, Pablo; Ribas, Dayana; Ortega, Alfonso; Miguel, Antonio; Lleida, Eduardo
Unsupervised Adaptation of Deep Speech Activity Detection Models to Unseen Domains Artículo de revista
En: Applied Sciences, vol. 12, no 4, pp. 1832, 2022.
@article{Gimeno2022,
  author    = {Pablo Gimeno and Dayana Ribas and Alfonso Ortega and Antonio Miguel and Eduardo Lleida},
  title     = {Unsupervised Adaptation of Deep Speech Activity Detection Models to Unseen Domains},
  journal   = {Applied Sciences},
  volume    = {12},
  number    = {4},
  pages     = {1832},
  year      = {2022},
  date      = {2022-02-10},
  urldate   = {2022-02-10},
  doi       = {10.3390/app12041832},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Mingote, Victoria; Miguel, Antonio; Ribas, Dayana; Ortega, Alfonso; Lleida, Eduardo
aDCF Loss Function for Deep Metric Learning in End-to-End Text-Dependent Speaker Verification Systems Artículo de revista
En: IEEE/ACM Transactions on Audio, Speech, and Language Processing, vol. 30, pp. 772-784, 2022.
@article{Mingote2022b,
  author    = {Victoria Mingote and Antonio Miguel and Dayana Ribas and Alfonso Ortega and Eduardo Lleida},
  title     = {{aDCF} Loss Function for Deep Metric Learning in End-to-End Text-Dependent Speaker Verification Systems},
  journal   = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
  volume    = {30},
  pages     = {772--784},
  year      = {2022},
  date      = {2022-01-25},
  urldate   = {2022-01-25},
  doi       = {10.1109/TASLP.2022.3145307},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Mingote, Victoria; Viñals, Ignacio; Gimeno, Pablo; Miguel, Antonio; Ortega, Alfonso; Lleida, Eduardo
Multimodal Diarization Systems by Training Enrollment Models as Identity Representations Artículo de revista
En: Applied Sciences, vol. 12, no 3, pp. 1141, 2022.
@article{Mingote2022,
  author    = {Victoria Mingote and Ignacio Viñals and Pablo Gimeno and Antonio Miguel and Alfonso Ortega and Eduardo Lleida},
  title     = {Multimodal Diarization Systems by Training Enrollment Models as Identity Representations},
  journal   = {Applied Sciences},
  volume    = {12},
  number    = {3},
  pages     = {1141},
  year      = {2022},
  date      = {2022-01-21},
  urldate   = {2022-01-21},
  doi       = {10.3390/app12031141},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Conferencias
Gimeno, Pablo; Ortega, Alfonso; Miguel, Antonio; Lleida, Eduardo
A Study on the Use of wav2vec Representations for Multiclass Audio Segmentation Conferencia
Proceedings of XII Jornadas en Tecnología del Habla and VIII Iberian SLTech (Iberspeech), 2022.
@conference{Gimeno2022b,
  author    = {Pablo Gimeno and Alfonso Ortega and Antonio Miguel and Eduardo Lleida},
  title     = {A Study on the Use of wav2vec Representations for Multiclass Audio Segmentation},
  booktitle = {Proceedings of XII Jornadas en Tecnología del Habla and VIII Iberian SLTech (Iberspeech)},
  pages     = {56--60},
  year      = {2022},
  date      = {2022-11-14},
  urldate   = {2022-11-14},
  doi       = {10.21437/IberSPEECH.2022-12},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Pastor, Miguel; Ribas, Dayana; Ortega, Alfonso; Miguel, Antonio; Lleida, Eduardo
Cross-Corpus Speech Emotion Recognition with HuBERT Self-Supervised Representation Conferencia
Proceedings of XII Jornadas en Tecnología del Habla and VIII Iberian SLTech (Iberspeech), 2022.
@conference{Pastor2022,
  author    = {Miguel Pastor and Dayana Ribas and Alfonso Ortega and Antonio Miguel and Eduardo Lleida},
  title     = {Cross-Corpus Speech Emotion Recognition with {HuBERT} Self-Supervised Representation},
  booktitle = {Proceedings of XII Jornadas en Tecnología del Habla and VIII Iberian SLTech (Iberspeech)},
  pages     = {76--80},
  year      = {2022},
  date      = {2022-11-14},
  urldate   = {2022-11-14},
  doi       = {10.21437/IberSPEECH.2022-16},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Ribas, Dayana; Pastor, Miguel; Miguel, Antonio; Martínez, David; Ortega, Alfonso; Lleida, Eduardo
S3prl-Disorder: Open-Source Voice Disorder Detection System based in the Framework of S3PRL-toolkit Conferencia
Proceedings of XII Jornadas en Tecnología del Habla and VIII Iberian SLTech (Iberspeech), 2022.
@conference{Ribas2022b,
  author    = {Dayana Ribas and Miguel Pastor and Antonio Miguel and David Martínez and Alfonso Ortega and Eduardo Lleida},
  title     = {{S3prl-Disorder}: Open-Source Voice Disorder Detection System based in the Framework of {S3PRL-toolkit}},
  booktitle = {Proceedings of XII Jornadas en Tecnología del Habla and VIII Iberian SLTech (Iberspeech)},
  pages     = {136--140},
  year      = {2022},
  date      = {2022-11-14},
  doi       = {10.21437/IberSPEECH.2022-28},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Miguel, Antonio; Ortega, Alfonso; Lleida, Eduardo
ViVoLAB System Description for the S2TC IberSPEECH-RTVE 2022 challenge Conferencia
Proceedings of XII Jornadas en Tecnología del Habla and VIII Iberian SLTech (Iberspeech), 2022.
@conference{Miguel2022,
  author    = {Antonio Miguel and Alfonso Ortega and Eduardo Lleida},
  title     = {{ViVoLAB} System Description for the {S2TC} {IberSPEECH-RTVE} 2022 challenge},
  booktitle = {Proceedings of XII Jornadas en Tecnología del Habla and VIII Iberian SLTech (Iberspeech)},
  year      = {2022},
  date      = {2022-11-14},
  urldate   = {2022-11-14},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Mingote, Victoria; Miguel, Antonio
Representation and Metric Learning Advances for Deep Neural Network Face and Speaker Biometric Systems Conferencia
Proceedings of XII Jornadas en Tecnología del Habla and VIII Iberian SLTech (Iberspeech), 2022.
@conference{Mingote2022c,
  author    = {Victoria Mingote and Antonio Miguel},
  title     = {Representation and Metric Learning Advances for Deep Neural Network Face and Speaker Biometric Systems},
  booktitle = {Proceedings of XII Jornadas en Tecnología del Habla and VIII Iberian SLTech (Iberspeech)},
  year      = {2022},
  date      = {2022-11-14},
  urldate   = {2022-11-14},
  doi       = {10.21437/IberSPEECH.2022-43},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
2021
Artículos de revista
Viñals, Ignacio; Ortega, Alfonso; Miguel, Antonio; Lleida, Eduardo
The Domain Mismatch Problem in the Broadcast Speaker Attribution Task Artículo de revista
En: Applied Sciences, vol. 11, no 18, pp. 8521, 2021.
@article{Viñals2021,
  author    = {Ignacio Viñals and Alfonso Ortega and Antonio Miguel and Eduardo Lleida},
  title     = {The Domain Mismatch Problem in the Broadcast Speaker Attribution Task},
  journal   = {Applied Sciences},
  volume    = {11},
  number    = {18},
  pages     = {8521},
  year      = {2021},
  date      = {2021-09-15},
  doi       = {10.3390/app11188521},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Gimeno, Pablo; Mingote, Victoria; Ortega, Alfonso; Miguel, Antonio; Lleida, Eduardo
Generalising AUC Optimisation to Multiclass Classification for Audio Segmentation with Limited Training Data Artículo de revista
En: IEEE Signal Processing Letters, vol. 28, pp. 1135-1139, 2021.
@article{Gimeno2021auc,
  author    = {Pablo Gimeno and Victoria Mingote and Alfonso Ortega and Antonio Miguel and Eduardo Lleida},
  title     = {Generalising {AUC} Optimisation to Multiclass Classification for Audio Segmentation with Limited Training Data},
  journal   = {IEEE Signal Processing Letters},
  volume    = {28},
  pages     = {1135--1139},
  year      = {2021},
  date      = {2021-05-27},
  doi       = {10.1109/LSP.2021.3084501},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Llombart, Jorge; Ribas, Dayana; Miguel, Antonio; Vicente, Luis; Ortega, Alfonso; Lleida, Eduardo
Progressive Loss Functions for Speech Enhancement with Deep Neural Networks Artículo de revista
En: EURASIP Journal on Audio, Speech, and Music Processing, vol. 2021, no 1, pp. 1-16, 2021.
@article{Llombart2021,
  author    = {Jorge Llombart and Dayana Ribas and Antonio Miguel and Luis Vicente and Alfonso Ortega and Eduardo Lleida},
  title     = {Progressive Loss Functions for Speech Enhancement with Deep Neural Networks},
  journal   = {EURASIP Journal on Audio, Speech, and Music Processing},
  volume    = {2021},
  number    = {1},
  pages     = {1--16},
  year      = {2021},
  date      = {2021-01-01},
  doi       = {10.1186/s13636-020-00191-3},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {article}
}
Conferencias
Gimeno, Pablo; Ortega, Alfonso; Miguel, Antonio; Lleida, Eduardo
Unsupervised Representation Learning for Speech Activity Detection in the Fearless Steps Challenge 2021 Conferencia
Proceedings of the Annual Conference of the International Speech Communication Association (INTERSPEECH), vol. 2021-September, 2021.
@conference{Gimeno2021,
  author    = {Pablo Gimeno and Alfonso Ortega and Antonio Miguel and Eduardo Lleida},
  title     = {Unsupervised Representation Learning for Speech Activity Detection in the {Fearless Steps Challenge} 2021},
  booktitle = {Proceedings of the Annual Conference of the International Speech Communication Association (INTERSPEECH)},
  volume    = {2021-September},
  year      = {2021},
  date      = {2021-09-06},
  doi       = {10.21437/Interspeech.2021-309},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}
Mingote, Victoria; Miguel, Antonio; Ortega, Alfonso; Lleida, Eduardo
Log-Likelihood-Ratio Cost Function as Objective Loss for Speaker Verification Systems Conferencia
Proceedings of the Annual Conference of the International Speech Communication Association (INTERSPEECH), vol. 2021-September, 2021.
@conference{Mingote2021_cllr,
  author    = {Victoria Mingote and Antonio Miguel and Alfonso Ortega and Eduardo Lleida},
  title     = {Log-Likelihood-Ratio Cost Function as Objective Loss for Speaker Verification Systems},
  booktitle = {Proceedings of the Annual Conference of the International Speech Communication Association (INTERSPEECH)},
  volume    = {2021-September},
  year      = {2021},
  date      = {2021-09-01},
  doi       = {10.21437/Interspeech.2021-1085},
  keywords  = {},
  pubstate  = {published},
  tppubtype = {conference}
}