Journals


Authors: Type:

2020

  • [DOI] F. J. Valverde-Albacete and C. Peláez-Moreno, “A framework for supervised classification performance analysis with information-theoretic methods,” IEEE Transactions on Knowledge and Data Engineering, pp. 1-1, 2020.
    [Bibtex]
    @article{val:pel:20,
      author   = {Valverde-Albacete, F. J. and Pel{\'a}ez-Moreno, C.},
      title    = {A framework for supervised classification performance analysis with information-theoretic methods},
      journal  = {IEEE Transactions on Knowledge and Data Engineering},
      year     = {2020},
      pages    = {1--1},
      keywords = {Task analysis;Entropy;Mutual information;Proposals;Tools;Performance analysis;Performance evaluation;classification algorithms;information entropy;mutual information;formal concept analysis},
      doi      = {10.1109/TKDE.2019.2915643},
      issn     = {2326-3865},
    }

2019

  • [DOI] E. Pla-Sacristán, I. González-Díaz, T. Martínez-Cortés, and F. Díaz-de-María, “Finding landmarks within settled areas using hierarchical density-based clustering and meta-data from publicly available images,” Expert Systems with Applications, vol. 123, pp. 315-327, 2019.
    [Bibtex]
    @article{pla:gon:mar:dia:19,
      author   = {Pla-Sacrist{\'a}n, Eduardo and Gonz{\'a}lez-D{\'i}az, Iv{\'a}n and Mart{\'i}nez-Cort{\'e}s, Tom{\'a}s and D{\'i}az-de-Mar{\'i}a, Fernando},
      title    = {Finding landmarks within settled areas using hierarchical density-based clustering and meta-data from publicly available images},
      journal  = {Expert Systems with Applications},
      volume   = {123},
      pages    = {315--327},
      year     = {2019},
      issn     = {0957-4174},
      doi      = {10.1016/j.eswa.2019.01.046},
      url      = {http://www.sciencedirect.com/science/article/pii/S0957417419300521},
      keywords = {Density-based clustering, K-DBSCAN, V-DBSCAN, Hierarchical clustering, Landmark detection, Tourism},
      abstract = {The process of determining relevant landmarks within a certain region is a challenging task, mainly due to its subjective nature. Many of the current lines of work include the use of density-based clustering algorithms as the base tool for such a task, as they permit the generation of clusters of different shapes and sizes. However, there are still important challenges, such as the variability in scale and density. In this paper, we present two novel density-based clustering algorithms that can be applied to solve this: K-DBSCAN, a clustering algorithm based on Gaussian Kernels used to detect individual inhabited cores within regions; and V-DBSCAN, a hierarchical algorithm suitable for sample spaces with variable density, which is used to attempt the discovery of relevant landmarks in cities or regions. The obtained results are outstanding, since the system properly identifies most of the main touristic attractions within a certain region under analysis. A comparison with respect to the state-of-the-art show that the presented method clearly outperforms the current methods devoted to solve this problem.},
    }
  • [DOI] M. Fernández-Torres, I. González-Díaz, and F. Díaz-de-María, “Probabilistic Topic Model for Context-Driven Visual Attention Understanding,” IEEE Transactions on Circuits and Systems for Video Technology, pp. 1-1, 2019.
    [Bibtex]
    @article{tor:gon:dia:19,
      author   = {Fern{\'a}ndez-Torres, M. and Gonz{\'a}lez-D{\'i}az, I. and D{\'i}az-de-Mar{\'i}a, F.},
      title    = {Probabilistic Topic Model for Context-Driven Visual Attention Understanding},
      journal  = {IEEE Transactions on Circuits and Systems for Video Technology},
      year     = {2019},
      pages    = {1--1},
      keywords = {Visualization;Task analysis;Adaptation models;Feature extraction;Computational modeling;Probabilistic logic;Context modeling;Top-down visual attention;hierarchical probabilistic framework;context-aware model;latent topic models},
      doi      = {10.1109/TCSVT.2019.2909427},
      issn     = {1558-2205},
    }
  • [DOI] I. González-Díaz, J. Benois-Pineau, J. Domenger, D. Cattaert, and A. de Rugy, “Perceptually-guided deep neural networks for ego-action prediction: Object grasping,” Pattern Recognition, vol. 88, pp. 223-235, 2019.
    [Bibtex]
    @article{Gonzalez2019,
      author   = {Gonz{\'a}lez-D{\'i}az, I. and Benois-Pineau, Jenny and Domenger, Jean-Philippe and Cattaert, Daniel and de Rugy, Aymar},
      title    = {Perceptually-guided deep neural networks for ego-action prediction: Object grasping},
      journal  = {Pattern Recognition},
      volume   = {88},
      pages    = {223--235},
      year     = {2019},
      issn     = {0031-3203},
      doi      = {10.1016/j.patcog.2018.11.013},
      url      = {http://www.sciencedirect.com/science/article/pii/S0031320318304011},
      keywords = {Human perception, Grasping action prediction, Weakly supervised active object detection},
    }
  • [DOI] F. J. Valverde-Albacete and C. Peláez-Moreno, “The Case for Shifting the Rényi Entropy,” Entropy, vol. 21, iss. 1, 2019.
    [Bibtex]
    @article{val:pel:19,
      author         = {Valverde-Albacete, Francisco J. and Pel{\'a}ez-Moreno, Carmen},
      title          = {The Case for Shifting the {R{\'e}nyi} Entropy},
      journal        = {Entropy},
      volume         = {21},
      year           = {2019},
      number         = {1},
      article-number = {46},
      url            = {http://www.mdpi.com/1099-4300/21/1/46},
      issn           = {1099-4300},
      abstract       = {We introduce a variant of the R{\'e}nyi entropy definition that aligns it with the well-known H{\"o}lder mean: in the new formulation, the r-th order R{\'e}nyi Entropy is the logarithm of the inverse of the r-th order H{\"o}lder mean. This brings about new insights into the relationship of the R{\'e}nyi entropy to quantities close to it, like the information potential and the partition function of statistical mechanics. We also provide expressions that allow us to calculate the R{\'e}nyi entropies from the Shannon cross-entropy and the escort probabilities. Finally, we discuss why shifting the R{\'e}nyi entropy is fruitful in some applications.},
      doi            = {10.3390/e21010046},
    }

2018

  • [DOI] K. A. Abdalmalak and A. Gallardo-Antolín, “Enhancement of a text-independent speaker verification system by using feature combination and parallel structure classifiers,” Neural Computing and Applications, vol. 29, iss. 3, pp. 637-651, 2018.
    [Bibtex]
    @article{Abdalmalak2018,
      author  = {Abdalmalak, Kerlos Atia and Gallardo-Antol{\'i}n, Ascensi{\'o}n},
      title   = {Enhancement of a text-independent speaker verification system by using feature combination and parallel structure classifiers},
      journal = {Neural Computing and Applications},
      year    = {2018},
      month   = feb,
      day     = {01},
      volume  = {29},
      number  = {3},
      pages   = {637--651},
      issn    = {1433-3058},
      doi     = {10.1007/s00521-016-2470-x},
      url     = {https://doi.org/10.1007/s00521-016-2470-x},
    }
  • [DOI] M. Molina-Moreno, I. González-Díaz, and F. Díaz-de-María, “Efficient Scale-Adaptive License Plate Detection System,” IEEE Transactions on Intelligent Transportation Systems, pp. 1-13, 2018.
    [Bibtex]
    @article{Molina-Moreno2018,
      author   = {Molina-Moreno, M. and Gonz{\'a}lez-D{\'i}az, I. and D{\'i}az-de-Mar{\'i}a, F.},
      title    = {Efficient Scale-Adaptive License Plate Detection System},
      journal  = {IEEE Transactions on Intelligent Transportation Systems},
      year     = {2018},
      pages    = {1--13},
      keywords = {Licenses;Detectors;Feature extraction;Deformable models;Lighting;Robustness;Image edge detection;License plate detection;GentleBoost;scale-adaptive part-based model;video surveillance},
      doi      = {10.1109/TITS.2018.2859035},
      issn     = {1524-9050},
    }
  • [DOI] I. González-Díaz, “DermaKNet: Incorporating the knowledge of dermatologists to Convolutional Neural Networks for skin lesion diagnosis,” IEEE Journal of Biomedical and Health Informatics, pp. 1-1, 2018.
    [Bibtex]
    @article{Gonzalez18,
      author   = {Gonz{\'a}lez-D{\'i}az, I.},
      title    = {{DermaKNet}: Incorporating the knowledge of dermatologists to Convolutional Neural Networks for skin lesion diagnosis},
      journal  = {IEEE Journal of Biomedical and Health Informatics},
      year     = {2018},
      pages    = {1--1},
      keywords = {Image segmentation;Informatics;Lesions;Malignant tumors;Skin;Solid modeling;Task analysis;CAD;Convolutional Neural Networks;Dermoscopy;Melanoma;Skin lesion analysis},
      doi      = {10.1109/JBHI.2018.2806962},
      issn     = {2168-2194},
      key      = {cogmax},
    }
  • [DOI] J. López-Labraca, M. Á. Fernández-Torres, I. González-Díaz, F. Díaz-de-María, and Á. Pizarro, “Enriched dermoscopic-structure-based cad system for melanoma diagnosis,” Multimedia Tools and Applications, vol. 77, iss. 10, pp. 12171-12202, 2018.
    [Bibtex]
    @article{Lopez-Labraca2018,
      author   = {L{\'o}pez-Labraca, Javier
                  and Fern{\'a}ndez-Torres, Miguel {\'A}ngel
                  and Gonz{\'a}lez-D{\'i}az, Iv{\'a}n
                  and D{\'i}az-de-Mar{\'i}a, Fernando
                  and Pizarro, {\'A}ngel},
      title    = {Enriched dermoscopic-structure-based cad system for melanoma diagnosis},
      journal  = {Multimedia Tools and Applications},
      year     = {2018},
      month    = may,
      volume   = {77},
      number   = {10},
      pages    = {12171--12202},
      keywords = {Computer-Aided Diagnosis, melanoma diagnosis, enriched diagnosis, dermoscopic structures, Bayesian fusion},
      doi      = {10.1007/s11042-017-4879-3},
      issn     = {1573-7721},
    }
  • [DOI] E. Martínez-Enríquez, J. Cid-Sueiro, F. Díaz-de-María, and A. Ortega, “Optimized Update/Prediction Assignment for Lifting Transforms on Graphs,” IEEE Transactions on Signal Processing, vol. 66, iss. 8, pp. 2098-2111, 2018.
    [Bibtex]
    @article{Martinez-Enriquez2018a,
      author   = {Mart{\'i}nez-Enr{\'i}quez, E. and Cid-Sueiro, J. and D{\'i}az-de-Mar{\'i}a, F. and Ortega, A.},
      title    = {Optimized Update/Prediction Assignment for Lifting Transforms on Graphs},
      journal  = {IEEE Transactions on Signal Processing},
      year     = {2018},
      month    = apr,
      volume   = {66},
      number   = {8},
      pages    = {2098--2111},
      keywords = {feature extraction;graph theory;optimisation;transforms;video signal processing;randomly generated graph signals;optimal U/P assignment;update/prediction assignment problem;good bipartition;feature extraction;transformations;optimized update/prediction assignment;Transforms;Indexes;Correlation;Topology;Compaction;Manganese;Noise reduction;Lifting transform;Graphs;$\mathcal{U}/\mathcal{P}$ assignment;splitting;graph bipartition},
      doi      = {10.1109/TSP.2018.2802465},
      issn     = {1053-587X},
    }
  • [DOI] E. Martínez-Enríquez, J. Cid-Sueiro, F. Díaz-de-María, and A. Ortega, “Directional Transforms for Video Coding Based on Lifting on Graphs,” IEEE Transactions on Circuits and Systems for Video Technology, vol. 28, iss. 4, pp. 933-946, 2018.
    [Bibtex]
    @article{Martinez-Enriquez2018b,
      author   = {Mart{\'i}nez-Enr{\'i}quez, E. and Cid-Sueiro, J. and D{\'i}az-de-Mar{\'i}a, F. and Ortega, A.},
      title    = {Directional Transforms for Video Coding Based on Lifting on Graphs},
      journal  = {IEEE Transactions on Circuits and Systems for Video Technology},
      year     = {2018},
      month    = apr,
      volume   = {28},
      number   = {4},
      pages    = {933--946},
      keywords = {data compression;filtering theory;graph theory;image filtering;image motion analysis;video coding;wavelet transforms;video coding;lifting transforms;video signal;temporal motion-related pixels;nonsimilar pixels;filtering operations;linked nodes;wavelet transforms;complete video encoder;temporal filtering wavelet;graph splitting;graph construction;H.264-AVC;3D directional transform;Wavelet transforms;Multiresolution analysis;Video coding;Encoding;Motion estimation;Entropy;Directional transforms;lifting transform;signal processing on graphs;video coding},
      doi      = {10.1109/TCSVT.2016.2633418},
      issn     = {1051-8215},
    }
  • [DOI] F. Fernández-Martínez, A. Hernández-García, M. A. Fernández-Torres, I. González-Díaz, Á. García-Faura, and F. Díaz-de-María, “Exploiting visual saliency for assessing the impact of car commercials upon viewers,” Multimedia Tools and Applications, vol. 77, iss. 15, pp. 18903-18933, 2018.
    [Bibtex]
    @article{FernandezMartinez2018,
      author        = {Fern{\'a}ndez-Mart{\'i}nez, F.
                       and Hern{\'a}ndez-Garc{\'i}a, A.
                       and Fern{\'a}ndez-Torres, M. A.
                       and Gonz{\'a}lez-D{\'i}az, I.
                       and Garc{\'i}a-Faura, {\'A}.
                       and D{\'i}az-de-Mar{\'i}a, F.},
      title         = {Exploiting visual saliency for assessing the impact of car commercials upon viewers},
      journal       = {Multimedia Tools and Applications},
      year          = {2018},
      month         = aug,
      volume        = {77},
      number        = {15},
      pages         = {18903--18933},
      keywords      = {Visual attention, Saliency, Scene analysis, Aesthetics assessment, Feature extraction, Video impact assessment},
      doi           = {10.1007/s11042-017-4879-3},
      issn          = {1573-7721},
      internal-note = {NOTE(review): this DOI is identical to the one recorded for entry Lopez-Labraca2018 (a different article), so it is presumably a copy-paste error; the correct value is likely 10.1007/s11042-017-5339-9 -- confirm against the publisher page before changing.},
    }
  • [DOI] F. J. Valverde-Albacete and C. Peláez-Moreno, “K-Formal Concept Analysis as linear algebra over idempotent semifields,” Information Sciences, vol. 467, pp. 579-603, 2018.
    [Bibtex]
    @article{val:pel:18c,
      author   = {Valverde-Albacete, Francisco J. and Pel{\'a}ez-Moreno, Carmen},
      title    = {K-Formal Concept Analysis as linear algebra over idempotent semifields},
      journal  = {Information Sciences},
      volume   = {467},
      pages    = {579--603},
      year     = {2018},
      issn     = {0020-0255},
      doi      = {10.1016/j.ins.2018.07.067},
      url      = {http://www.sciencedirect.com/science/article/pii/S0020025516312051},
      keywords = {Generalised Formal Concept Analysis, Concept lattice, Neighborhood lattice, Idempotent semiring, Dioid, Confusion matrix},
      abstract = {We report on progress in characterizing K-valued FCA in algebraic terms, where K is an idempotent semifield. In this data mining-inspired approach, incidences are matrices and sets of objects and attributes are vectors. The algebraization allows us to write matrix-calculus formulae describing the polars and the fixpoint equations for extents and intents. Adopting also the point of view of the theory of linear operators between vector spaces we explore the similarities and differences of the idempotent semimodules of extents and intents with the subspaces related to a linear operator in standard algebra. This allows us to shed some light into Formal Concept Analysis from the point of view of the theory of linear operators over idempotent semimodules. In the opposite direction, we state the importance of FCA-related concepts for dual order homomorphisms of linear spaces over idempotent semifields, specially congruences, the lattices of extents, intents and formal concepts.},
    }
  • [DOI] F. J. Valverde-Albacete and C. Peláez-Moreno, “Assessing Information Transmission in Data Transformations with the Channel Multivariate Entropy Triangle,” Entropy, vol. 20, iss. 7, 2018.
    [Bibtex]
    @article{val:pel:18b,
      author         = {Valverde-Albacete, Francisco J. and Pel{\'a}ez-Moreno, Carmen},
      title          = {Assessing Information Transmission in Data Transformations with the Channel Multivariate Entropy Triangle},
      journal        = {Entropy},
      volume         = {20},
      year           = {2018},
      number         = {7},
      article-number = {498},
      url            = {http://www.mdpi.com/1099-4300/20/7/498},
      issn           = {1099-4300},
      abstract       = {Data transformation, e.g., feature transformation and selection, is an integral part of any machine learning procedure. In this paper, we introduce an information-theoretic model and tools to assess the quality of data transformations in machine learning tasks. In an unsupervised fashion, we analyze the transformation of a discrete, multivariate source of information $\overline{X}$ into a discrete, multivariate sink of information $\overline{Y}$ related by a distribution $P_{\overline{X}\,\overline{Y}}$. The first contribution is a decomposition of the maximal potential entropy of $(\overline{X},\overline{Y})$, which we call a balance equation, into its (a) non-transferable, (b) transferable, but not transferred, and (c) transferred parts. Such balance equations can be represented in (de Finetti) entropy diagrams, our second set of contributions. The most important of these, the aggregate channel multivariate entropy triangle, is a visual exploratory tool to assess the effectiveness of multivariate data transformations in transferring information from input to output variables. We also show how these decomposition and balance equations also apply to the entropies of $\overline{X}$ and $\overline{Y}$, respectively, and generate entropy triangles for them. As an example, we present the application of these tools to the assessment of information transfer efficiency for Principal Component Analysis and Independent Component Analysis as unsupervised feature transformation and selection procedures in supervised classification tasks.},
      doi            = {10.3390/e20070498},
    }
  • [DOI] A. Rodríguez-Hidalgo, C. Peláez-Moreno, and A. Gallardo-Antolín, “The Robustness of Echoic Log-Surprise Auditory Saliency Detection,” IEEE Access, vol. 6, pp. 72083-72093, 2018.
    [Bibtex]
    @article{rod:pel:gal:18b,
      author   = {Rodr{\'i}guez-Hidalgo, A. and Pel{\'a}ez-Moreno, C. and Gallardo-Antol{\'i}n, A.},
      title    = {The Robustness of Echoic Log-Surprise Auditory Saliency Detection},
      journal  = {IEEE Access},
      year     = {2018},
      volume   = {6},
      pages    = {72083--72093},
      keywords = {Acoustics;Robustness;Task analysis;Saliency detection;Signal processing algorithms;Bayes methods;Spectrogram;Acoustic saliency;echoic memory;multi-scale;statistical divergence;Jensen-Shannon;acoustic event detection},
      doi      = {10.1109/ACCESS.2018.2882055},
      issn     = {2169-3536},
    }
  • [DOI] A. Rodríguez-Hidalgo, C. Peláez-Moreno, and A. Gallardo-Antolín, “Echoic log-surprise: A multi-scale scheme for acoustic saliency detection,” Expert Systems with Applications, vol. 114, pp. 255-266, 2018.
    [Bibtex]
    @article{rod:pel:gal:18,
      author   = {Rodr{\'i}guez-Hidalgo, Antonio and Pel{\'a}ez-Moreno, Carmen and Gallardo-Antol{\'i}n, Ascensi{\'o}n},
      title    = {Echoic log-surprise: A multi-scale scheme for acoustic saliency detection},
      journal  = {Expert Systems with Applications},
      volume   = {114},
      pages    = {255--266},
      year     = {2018},
      issn     = {0957-4174},
      doi      = {10.1016/j.eswa.2018.07.018},
      url      = {http://www.sciencedirect.com/science/article/pii/S0957417418304330},
      keywords = {Acoustic saliency, Echoic memory, Multi-scale, Statistical divergence, Jensen--Shannon, Acoustic Event Detection},
      abstract = {Perceptual signals such as acoustic or visual cues carry a massive amount of information. From a human perspective, this problem is solved by means of cognitive mechanisms related to attention. In particular, saliency is a property of particular stimuli that makes them stand from others to allow the brain to take decisions about their relevance in the process of exploring the world. For artificial intelligence systems it is advantageous to mimic these mechanisms. Visual saliency algorithms have been successfully employed in tasks such as medical diagnosis, detection of violent scenes, environment understanding made by robots, etc. In contrast, computational models of the acoustic saliency mechanisms are less extended. In this context, we propose a novel acoustic saliency algorithm to be used by intelligent and expert systems facing tasks such as sound detection and classification, early alarm, surveillance, robotic exploration of the surroundings, among many other applications. This technique, we termed echoic log-surprise, combines an unsupervised statistical approach based on Bayesian log-surprise and the biological concept of echoic or Auditory Sensory Memory. Our algorithm computes several independent log-surprise cues in parallel considering a wide range of memory values, with the aim of leveraging saliency information from different temporal scales. Then, we explore several statistical metrics to combine these multi-scale signals in a single temporal saliency signal including Renyi entropy, Jensen-Shannon divergence, Cramer or Bhattacharyya distances. We have adopted Acoustic Event Detection tasks as adequate proxies to test its performance. Results show that the proposed echoic log-surprise method outperforms classical acoustic detection techniques commonly deployed in intelligent and expert systems, such as energy thresholding or voice activity detection, and it also achieves better results than some other state-of-the-art acoustic saliency algorithms, such as Kalinli's and conventional log-surprise.},
    }
  • [DOI] I. González-Díaz, “DermaKNet: Incorporating the knowledge of dermatologists to Convolutional Neural Networks for skin lesion diagnosis,” IEEE Journal of Biomedical and Health Informatics, iss. 99, pp. 1-1, 2018.
    [Bibtex]
    @article{Gonzalez18,
      author        = {Gonz{\'a}lez-D{\'i}az, I.},
      title         = {{DermaKNet}: Incorporating the knowledge of dermatologists to Convolutional Neural Networks for skin lesion diagnosis},
      journal       = {IEEE Journal of Biomedical and Health Informatics},
      year          = {2018},
      pages         = {1--1},
      keywords      = {Image segmentation;Informatics;Lesions;Malignant tumors;Skin;Solid modeling;Task analysis;CAD;Convolutional Neural Networks;Dermoscopy;Melanoma;Skin lesion analysis},
      doi           = {10.1109/JBHI.2018.2806962},
      issn          = {2168-2194},
      key           = {cogmax},
      internal-note = {NOTE(review): the citation key Gonzalez18 is also defined by an earlier record for the same article in this list; BibTeX reports a repeated entry, so one of the two records should be retired.},
    }

2017

  • [DOI] J. Ludeña-Choez, R. Quispe-Soncco, and A. Gallardo-Antolín, “Bird sound spectrogram decomposition through Non-Negative Matrix Factorization for the acoustic classification of bird species,” PLOS ONE, vol. 12, iss. 6, pp. 1-20, 2017.
    [Bibtex]
    @article{Ludena-Choez2017,
      author    = {Lude{\~n}a-Choez, Jimmy and Quispe-Soncco, Raisa and Gallardo-Antol{\'i}n, Ascensi{\'o}n},
      title     = {Bird sound spectrogram decomposition through Non-Negative Matrix Factorization for the acoustic classification of bird species},
      journal   = {PLOS ONE},
      publisher = {Public Library of Science},
      year      = {2017},
      month     = jun,
      volume    = {12},
      number    = {6},
      pages     = {1--20},
      doi       = {10.1371/journal.pone.0179403},
      url       = {https://doi.org/10.1371/journal.pone.0179403},
    }
  • [DOI] F. de-la-Calle-Silos and R. M. Stern, “Synchrony-Based Feature Extraction for Robust Automatic Speech Recognition,” IEEE Signal Processing Letters, vol. 24, iss. 8, pp. 1158-1162, 2017.
    [Bibtex]
    @article{de-la-Calle-Silos2017,
      author   = {de-la-Calle-Silos, Fernando and Stern, Richard M.},
      title    = {Synchrony-Based Feature Extraction for Robust Automatic Speech Recognition},
      journal  = {IEEE Signal Processing Letters},
      year     = {2017},
      month    = aug,
      volume   = {24},
      number   = {8},
      pages    = {1158--1162},
      keywords = {feature extraction;speech recognition;noise removal;noise suppression;multiple standard speech databases;generalized synchrony detector;putative synchrony;temporal patterns;auditory-nerve activity;feature extraction schemes;automatic speech recognition system robustness enhancement;auditory-nerve firings;temporal pattern model application;robust automatic speech recognition;synchrony-based feature extraction;Feature extraction;Mel frequency cepstral coefficient;Speech recognition;Speech;Robustness;Frequency synchronization;Databases;Auditory modeling;auditory synchrony;feature extraction;physiological modeling;robust speech recognition},
      doi      = {10.1109/LSP.2017.2714192},
      issn     = {1070-9908},
    }
  • [DOI] J. L. González-de-Suso, E. Martínez-Enríquez, and F. Díaz-de-María, “Adaptive Lagrange multiplier estimation algorithm in HEVC,” Signal Processing: Image Communication, vol. 56, pp. 40-51, 2017.
    [Bibtex]
    @article{GONZALEZDESUSO2017,
      author   = {Gonz{\'a}lez-de-Suso, Jos{\'e} Luis and Mart{\'i}nez-Enr{\'i}quez, Eduardo and D{\'i}az-de-Mar{\'i}a, Fernando},
      title    = {Adaptive {Lagrange} multiplier estimation algorithm in {HEVC}},
      journal  = {Signal Processing: Image Communication},
      volume   = {56},
      pages    = {40--51},
      year     = {2017},
      month    = aug,
      issn     = {0923-5965},
      doi      = {10.1016/j.image.2017.04.010},
      url      = {http://www.sciencedirect.com/science/article/pii/S0923596517300760},
      keywords = {HEVC, Motion estimation, Rate-distortion optimization, Source coding, Video coding},
    }
  • [DOI] A. Jiménez-Moreno, E. Martínez-Enríquez, and F. Díaz-de-María, “Bayesian adaptive algorithm for fast coding unit decision in the High Efficiency Video Coding (HEVC) standard,” Signal Processing: Image Communication, vol. 56, pp. 1-11, 2017.
    [Bibtex]
    @article{JIMENEZMORENO2017,
      author  = {Jim{\'e}nez-Moreno, Amaya and Mart{\'i}nez-Enr{\'i}quez, Eduardo and D{\'i}az-de-Mar{\'i}a, Fernando},
      title   = {{Bayesian} adaptive algorithm for fast coding unit decision in the {High Efficiency Video Coding} ({HEVC}) standard},
      journal = {Signal Processing: Image Communication},
      volume  = {56},
      pages   = {1--11},
      year    = {2017},
      month   = aug,
      issn    = {0923-5965},
      doi     = {10.1016/j.image.2017.04.004},
      url     = {http://www.sciencedirect.com/science/article/pii/S092359651730070X},
    }
  • [DOI] I. González-Díaz, M. Birinci, F. Díaz-de-María, and E. J. Delp, “Neighborhood Matching for Image Retrieval,” IEEE Transactions on Multimedia, vol. 19, iss. 3, pp. 544-558, 2017.
    [Bibtex]
    @article{Gonzalez-Diaz2017,
      author   = {Gonz{\'a}lez-D{\'i}az, I. and Birinci, M. and D{\'i}az-de-Mar{\'i}a, F. and Delp, E. J.},
      title    = {Neighborhood Matching for Image Retrieval},
      journal  = {IEEE Transactions on Multimedia},
      year     = {2017},
      month    = mar,
      volume   = {19},
      number   = {3},
      pages    = {544--558},
      keywords = {computational complexity;formal verification;geometry;image matching;image retrieval;neighborhood matching;large-scale image retrieval framework;multimedia community;initial reference image ranking;fast approximations;image geometric layout;computational complexity;keypoint matching process;geometric verification step;computational efficiency;Oxford 5 k dataset;Oxford 105 k dataset;Visualization;Image retrieval;Computational complexity;Feature extraction;Computational modeling;Vocabulary;Histograms;Geometric verification;image retrieval;neighborhood matching (NM);robust estimation},
      doi      = {10.1109/TMM.2016.2616298},
      issn     = {1520-9210},
    }
  • [DOI] F. J. Valverde-Albacete and C. Peláez-Moreno, “The Evaluation of Data Sources using Multivariate Entropy Tools,” Expert Systems with Applications, vol. 78, pp. 145-157, 2017.
    [Bibtex]
    @article{val:pel:17b,
      author        = {Valverde-Albacete, Francisco J. and Pel{\'a}ez-Moreno, C.},
      title         = {The Evaluation of Data Sources using Multivariate Entropy Tools},
      journal       = {Expert Systems with Applications},
      volume        = {78},
      pages         = {145--157},
      year          = {2017},
      doi           = {10.1016/j.eswa.2017.02.010},
      date-added    = {2017-01-13 13:55:34 +0000},
      date-modified = {2017-03-02 10:56:57 +0000},
      bdsk-url-1    = {http://dx.doi.org/10.1016/j.eswa.2017.02.010},
      key           = {cogmax},
    }
  • F. J. Valverde Albacete and C. Peláez-Moreno, “Entropy operates in Non-Linear Semifields,” Arxiv, iss. 1710.04728 [cs.IT], 2017.
    [Bibtex]
    @article{val:pel:17c,
      author        = {Valverde-Albacete, Francisco Jos{\'e} and Pel{\'a}ez-Moreno, Carmen},
      title         = {Entropy operates in Non-Linear Semifields},
      journal       = {CoRR},
      volume        = {abs/1710.04728},
      year          = {2017},
      url           = {https://arxiv.org/abs/1710.04728},
      archivePrefix = {arXiv},
      eprint        = {1710.04728},
      primaryClass  = {cs.IT},
      date-added    = {2017-11-04 20:13:49 +0000},
      date-modified = {2017-12-14 09:49:54 +0000},
      key           = {cogmax},
    }
  • [DOI] I. González-Díaz, M. Birinci, F. Díaz-de-María, and E. J. Delp, “Neighborhood Matching for Image Retrieval,” IEEE Transactions on Multimedia, vol. 19, iss. 3, pp. 544-558, 2017.
    [Bibtex]
    @article{Gonzalez17a,
      author   = {Gonz{\'a}lez-D{\'i}az, I. and Birinci, M. and D{\'i}az-de-Mar{\'i}a, F. and Delp, E. J.},
      title    = {Neighborhood Matching for Image Retrieval},
      journal  = {IEEE Transactions on Multimedia},
      year     = {2017},
      month    = mar,
      volume   = {19},
      number   = {3},
      pages    = {544--558},
      keywords = {computational complexity;formal verification;geometry;image matching;image retrieval;Oxford 105 k dataset;Oxford 5 k dataset;computational complexity;computational efficiency;fast approximations;geometric verification step;image geometric layout;initial reference image ranking;keypoint matching process;large-scale image retrieval framework;multimedia community;neighborhood matching;Computational complexity;Computational modeling;Feature extraction;Histograms;Image retrieval;Visualization;Vocabulary;Geometric verification;image retrieval;neighborhood matching (NM);robust estimation},
      doi      = {10.1109/TMM.2016.2616298},
      issn     = {1520-9210},
      key      = {cogmax},
    }
  • I. González-Díaz, “Incorporating the Knowledge of Dermatologists to Convolutional Neural Networks for the Diagnosis of Skin Lesions,” CoRR, vol. abs/1703.01976, 2017.
    [Bibtex]
    @article{Gonzalez17b,
      key           = {cogmax},
      author        = {Iv{\'{a}}n Gonz{\'{a}}lez{-}D{\'{\i}}az},
      title         = {Incorporating the Knowledge of Dermatologists to Convolutional Neural Networks for the Diagnosis of Skin Lesions},
      journal       = {CoRR},
      volume        = {abs/1703.01976},
      year          = {2017},
      eprint        = {1703.01976},
      archivePrefix = {arXiv},
      url           = {http://arxiv.org/abs/1703.01976},
      biburl        = {https://dblp.org/rec/bib/journals/corr/González-Díaz17},
      bibsource     = {dblp computer science bibliography, https://dblp.org},
      timestamp     = {Wed, 07 Jun 2017 14:41:22 +0200}
    }

2016

  • I. González-Díaz, V. Buso, and J. Benois-Pineau, “Perceptual modeling in the problem of active object recognition in visual scenes,” Pattern Recognition, vol. 56, iss. Supplement C, pp. 129-141, 2016.
    [Bibtex]
    @article{Gonzalez16,
      author   = {Gonz{\'a}lez-D{\'i}az, Iv{\'a}n and Buso, Vincent and Benois-Pineau, Jenny},
      title    = {Perceptual modeling in the problem of active object recognition in visual scenes},
      journal  = {Pattern Recognition},
      volume   = {56},
      pages    = {129--141},
      year     = {2016},
      issn     = {0031-3203},
      keywords = {Perceptual modeling, Visual saliency, Active object recognition, Foveal and peripheral pathways},
    }
  • [DOI] A. Hernández-García, F. Fernández-Martínez, and F. Díaz-de-María, “Comparing visual descriptors and automatic rating strategies for video aesthetics prediction,” Signal Processing: Image Communication, vol. 47, pp. 280-288, 2016.
    [Bibtex]
    @article{HERNANDEZGARCIA2016280,
      author   = {Hern{\'a}ndez-Garc{\'i}a, A. and Fern{\'a}ndez-Mart{\'i}nez, F. and D{\'i}az-de-Mar{\'i}a, F.},
      title    = {Comparing visual descriptors and automatic rating strategies for video aesthetics prediction},
      journal  = {Signal Processing: Image Communication},
      volume   = {47},
      pages    = {280--288},
      year     = {2016},
      month    = sep,
      issn     = {0923-5965},
      doi      = {10.1016/j.image.2016.07.004},
      url      = {http://www.sciencedirect.com/science/article/pii/S0923596516301035},
      keywords = {Automatic aesthetics prediction, Image descriptors, Video descriptors, YouTube, Automatic annotation},
    }
  • [DOI] A. Jiménez-Moreno, E. Martínez-Enríquez, and F. Díaz-de-María, “Complexity Control Based on a Fast Coding Unit Decision Method in the HEVC Video Coding Standard,” IEEE Transactions on Multimedia, vol. 18, iss. 4, pp. 563-575, 2016.
    [Bibtex]
    @article{JimenezMoreno2016,
      author   = {Jim{\'e}nez-Moreno, A. and Mart{\'i}nez-Enr{\'i}quez, E. and D{\'i}az-de-Mar{\'i}a, F.},
      title    = {Complexity Control Based on a Fast Coding Unit Decision Method in the {HEVC} Video Coding Standard},
      journal  = {IEEE Transactions on Multimedia},
      year     = {2016},
      month    = apr,
      volume   = {18},
      number   = {4},
      pages    = {563--575},
      keywords = {computational complexity;data structures;video coding;fast coding unit decision method;HEVC video coding standard;coding tool;prediction unit;transform unit;flexible data representation;computational complexity control algorithm;CC algorithm;hierarchical approach;encoding time;video content;encoding configuration;target complexity reduction method;coding complexity;Encoding;Complexity theory;Standards;Proposals;Streaming media;Complexity control;fast coding unit decision;HEVC;on the fly estimation;Complexity control (CC);fast coding unit decision;high efficiency video coding (HEVC);on the fly estimation},
      doi      = {10.1109/TMM.2016.2524995},
      issn     = {1520-9210},
    }
  • [DOI] J. M. González-Calabozo, F. J. Valverde-Albacete, and C. Peláez-Moreno, “Interactive knowledge discovery and data mining on genomic expression data with numeric formal concept analysis,” BMC Bioinformatics, vol. 17, 2016.
    [Bibtex]
    @article{gon:val:pel:16,
      author    = {Gonz{\'a}lez-Calabozo, Jos{\'e} M. and Valverde-Albacete, Francisco J. and Pel{\'a}ez-Moreno, Carmen},
      title     = {Interactive knowledge discovery and data mining on genomic expression data with numeric formal concept analysis},
      journal   = {{BMC} Bioinformatics},
      volume    = {17},
      year      = {2016},
      issn      = {1471-2105},
      doi       = {10.1186/s12859-016-1234-z},
      unique-id = {WOS:000383403800002},
      type      = {Journal Article},
    }
  • [DOI] F. J. Valverde-Albacete and C. Peláez-Moreno, “The spectra of reducible matrices over complete commutative idempotent semifields and their spectral lattices,” International Journal of General Systems, vol. 45, iss. 2, pp. 86-115, 2016.
    [Bibtex]
    @article{val:pel:16,
      author        = {Valverde-Albacete, Francisco Jos{\'e} and Pel{\'a}ez-Moreno, Carmen},
      title         = {The spectra of reducible matrices over complete commutative idempotent semifields and their spectral lattices},
      journal       = {International Journal of General Systems},
      volume        = {45},
      number        = {2},
      pages         = {86--115},
      year          = {2016},
      publisher     = {Taylor \& Francis},
      doi           = {10.1080/03081079.2015.1072923},
      url           = {http://dx.doi.org/10.1080/03081079.2015.1072923},
      eprint        = {http://dx.doi.org/10.1080/03081079.2015.1072923},
      Date-Added    = {2017-11-05 12:20:30 +0000},
      Date-Modified = {2017-11-05 12:22:07 +0000},
      Bdsk-Url-1    = {http://dx.doi.org/10.1080/03081079.2015.1072923},
      key           = {cogmax},
    }
  • [DOI] J. Ludeña-Choez and A. Gallardo-Antolín, “Acoustic Event Classification using spectral band selection and Non-Negative Matrix Factorization-based features,” Expert Systems with Applications, vol. 46, pp. 77-86, 2016.
    [Bibtex]
    @article{lud16,
      author   = {Ludeña-Choez, Jimmy and Gallardo-Antolín, Ascensión},
      title    = {Acoustic Event Classification using spectral band selection and Non-Negative Matrix Factorization-based features},
      journal  = {Expert Systems with Applications},
      volume   = {46},
      pages    = {77--86},
      year     = {2016},
      issn     = {0957-4174},
      doi      = {10.1016/j.eswa.2015.10.018},
      url      = {http://www.sciencedirect.com/science/article/pii/S0957417415007137},
      keywords = {Acoustic Event Classification, Feature extraction, Temporal feature integration, Feature selection, Mutual information, Non-Negative Matrix Factorization},
      key      = {samurai},
    }
  • [DOI] A. Jiménez-Moreno, E. Martínez-Enríquez, and F. Díaz-de-María, “Complexity Control Based on a Fast Coding Unit Decision Method in the HEVC Video Coding Standard,” IEEE Transactions on Multimedia, vol. 18, iss. 4, pp. 563-575, 2016.
    [Bibtex]
    @article{jim16,
      author   = {Jiménez-Moreno, A. and Martínez-Enríquez, E. and Díaz-de-María, F.},
      title    = {Complexity Control Based on a Fast Coding Unit Decision Method in the {HEVC} Video Coding Standard},
      journal  = {IEEE Transactions on Multimedia},
      volume   = {18},
      number   = {4},
      pages    = {563--575},
      year     = {2016},
      month    = apr,
      issn     = {1520-9210},
      doi      = {10.1109/TMM.2016.2524995},
      keywords = {computational complexity;data structures;video coding;CC algorithm;HEVC video coding standard;coding complexity;coding tool;computational complexity control algorithm;encoding configuration;encoding time;fast coding unit decision method;flexible data representation;hierarchical approach;prediction unit;target complexity reduction method;transform unit;video content;Complexity theory;Encoding;Proposals;Standards;Streaming media;Complexity control;Complexity control (CC);HEVC;fast coding unit decision;high efficiency video coding (HEVC);on the fly estimation},
      key      = {samurai},
    }
  • [DOI] I. González-Díaz, V. Buso, and J. Benois-Pineau, “Perceptual modeling in the problem of active object recognition in visual scenes,” Pattern Recognition, vol. 56, pp. 129-141, 2016.
    [Bibtex]
    @article{RN405,
      author    = {González-Díaz, Iván and Buso, Vincent and Benois-Pineau, Jenny},
      title     = {Perceptual modeling in the problem of active object recognition in visual scenes},
      journal   = {Pattern Recognition},
      volume    = {56},
      pages     = {129--141},
      year      = {2016},
      issn      = {0031-3203},
      doi       = {10.1016/j.patcog.2016.03.007},
      unique-id = {WOS:000375360900011},
      type      = {Journal Article},
    }
  • [DOI] F. J. Valverde-Albacete, J. M. González-Calabozo, A. Peñas, and C. Peláez-Moreno, “Supporting scientific knowledge discovery with extended, generalized Formal Concept Analysis,” Expert Systems with Applications, vol. 44, pp. 198-216, 2016.
    [Bibtex]
    @article{val:gon:pen:pel:15old,
      author    = {Valverde-Albacete, Francisco J. and Gonz{\'a}lez-Calabozo, J. M. and Pe{\~n}as, A. and Pel{\'a}ez-Moreno, Carmen},
      title     = {Supporting scientific knowledge discovery with extended, generalized Formal Concept Analysis},
      journal   = {Expert Systems with Applications},
      volume    = {44},
      pages     = {198--216},
      year      = {2016},
      issn      = {0957-4174},
      doi       = {10.1016/j.eswa.2015.09.022},
      unique-id = {WOS:000365051500019},
      type      = {Journal Article},
    }

2015

  • [DOI] V. Buso, I. González-Díaz, and J. Benois-Pineau, “Goal-oriented top-down probabilistic visual attention model for recognition of manipulated objects in egocentric videos,” Signal Processing: Image Communication, vol. 39, 2015.
    [Bibtex]
    @article{Buso15,
      author  = {Buso, Vincent and Gonz{\'a}lez-D{\'i}az, Iv{\'a}n and Benois-Pineau, Jenny},
      title   = {Goal-oriented top-down probabilistic visual attention model for recognition of manipulated objects in egocentric videos},
      journal = {Signal Processing: Image Communication},
      volume  = {39},
      pages   = {418--431},
      year    = {2015},
      month   = jun,
      doi     = {10.1016/j.image.2015.05.006},
    }
  • [DOI] M. de-Frutos-López, J. L. González-de-Suso, S. Sanz-Rodríguez, C. Peláez-Moreno, and F. Díaz-de-María, “Two-level sliding-window VBR control algorithm for video on demand streaming,” Signal Processing: Image Communication, vol. 36, pp. 1-13, 2015.
    [Bibtex]
    @article{DEFRUTOSLOPEZ20151,
      author   = {de-Frutos-López, Manuel and González-de-Suso, José Luis and Sanz-Rodríguez, Sergio and Peláez-Moreno, Carmen and Díaz-de-María, Fernando},
      title    = {Two-level sliding-window {VBR} control algorithm for video on demand streaming},
      journal  = {Signal Processing: Image Communication},
      volume   = {36},
      pages    = {1--13},
      year     = {2015},
      issn     = {0923-5965},
      doi      = {10.1016/j.image.2015.05.004},
      url      = {http://www.sciencedirect.com/science/article/pii/S092359651500079X},
      keywords = {Video coding, HEVC, Rate control, VBR, Video storage, Video on demand},
      abstract = {A two-level variable bit rate (VBR) control algorithm for hierarchical video coding, specifically tailored for the new High Efficiency Video Coding (HEVC) standard, is presented here. A long-term level monitors the current bit count along a sliding window of a few seconds, comprising several intra-periods (IPs) and shifted on an IP basis. This long-term view allows the accommodation of the naturally occurring rate variations at a slow pace, avoiding the annoying sharp quality changes commonly appearing when non-sliding window approaches are used. The bit excesses or defects observed at this level are evenly delivered to a short-term level mechanism that establishes target bit budgets for a narrower sliding window covering a single IP and shifting on a frame basis. At this level, an adequate quantization parameter is estimated to comply with the designated target bit rate. Recommended test conditions as well as two few minutes long video sequences with scene cuts have been used for the assessment of the proposed VBR controller. Comparisons with a state-of-the-art rate control algorithm have produced good results in terms of quality consistency, in exchange for moderate rate-distortion performance losses.},
    }
  • [DOI] I. González-Díaz, T. Martínez-Cortés, A. Gallardo-Antolín, and F. Díaz-de-María, “Temporal segmentation and keyframe selection methods for user-generated video search-based annotation,” Expert Systems with Applications, vol. 42, iss. 1, pp. 488-502, 2015.
    [Bibtex]
    @article{GONZALEZDIAZ2015488,
      author   = {González-Díaz, Iván and Martínez-Cortés, Tomás and Gallardo-Antolín, Ascensión and Díaz-de-María, Fernando},
      title    = {Temporal segmentation and keyframe selection methods for user-generated video search-based annotation},
      journal  = {Expert Systems with Applications},
      volume   = {42},
      number   = {1},
      pages    = {488--502},
      year     = {2015},
      issn     = {0957-4174},
      doi      = {10.1016/j.eswa.2014.08.001},
      url      = {http://www.sciencedirect.com/science/article/pii/S0957417414004771},
      keywords = {User Generated Video, Video annotation, Video temporal segmentation, Camera motion analysis, Keyframe selection},
      abstract = {In this paper we propose a temporal segmentation and a keyframe selection method for User-Generated Video (UGV). Since UGV is rarely structured in shots and usually user’s interest are revealed through camera movements, a UGV temporal segmentation system has been proposed that generates a video partition based on a camera motion classification. Motion-related mid-level features have been suggested to feed a Hierarchical Hidden Markov Model (HHMM) that produces a user-meaningful UGV temporal segmentation. Moreover, a keyframe selection method has been proposed that picks a keyframe for fixed-content camera motion patterns such as zoom, still, or shake and a set of keyframes for varying-content translation patterns. The proposed video segmentation approach has been compared to a state-of-the-art algorithm, achieving 8\% performance improvement in a segmentation-based evaluation. Furthermore, a complete search-based UGV annotation system has been developed to assess the influence of the proposed algorithms on an end-user task. To that purpose, two UGV datasets have been developed and made available online. Specifically, the relevance of the considered camera motion types has been analyzed for these two datasets, and some guidelines are given to achieve the desired performance-complexity tradeoff. The keyframe selection algorithm for varying-content translation patterns has also been assessed, revealing a notable contribution to the performance of the global UGV annotation system. Finally, it has been shown that the UGV segmentation algorithm also produces improved annotation results with respect to a fixed-rate keyframe selection baseline or a traditional method relying on frame-level visual features.},
    }
  • [DOI] F. Fernández-Martínez, A. Hernández-García, and F. Díaz-de-María, “Succeeding metadata based annotation scheme and visual tips for the automatic assessment of video aesthetic quality in car commercials,” Expert Systems with Applications, vol. 42, iss. 1, pp. 293-305, 2015.
    [Bibtex]
    @article{FERNANDEZMARTINEZ2015293,
      author   = {Fernández-Martínez, F. and Hernández-García, A. and Díaz-de-María, F.},
      title    = {Succeeding metadata based annotation scheme and visual tips for the automatic assessment of video aesthetic quality in car commercials},
      journal  = {Expert Systems with Applications},
      volume   = {42},
      number   = {1},
      pages    = {293--305},
      year     = {2015},
      issn     = {0957-4174},
      doi      = {10.1016/j.eswa.2014.07.033},
      url      = {http://www.sciencedirect.com/science/article/pii/S0957417414004400},
      keywords = {Automatic video annotation, Aesthetic quality assessment, Video sentiment analysis, Video metadata, YouTube},
      abstract = {In this paper, we present a computational model capable to predict the viewer perception of car advertisements videos by using a set of low-level video descriptors. Our research goal relies on the hypothesis that these descriptors could reflect the aesthetic value of the videos and, in turn, their viewers’ perception. To that effect, and as a novel approach to this problem, we automatically annotate our video corpus, downloaded from YouTube, by applying an unsupervised clustering algorithm to the retrieved metadata linked to the viewers’ assessments of the videos. In this regard, a regular k-means algorithm is applied as partitioning method with k ranging from 2 to 5 clusters, modeling different satisfaction levels or classes. On the other hand, available metadata is categorized into two different types based on the profile of the viewers of the videos: metadata based on explicit and implicit opinion respectively. These two types of metadata are first individually tested and then combined together resulting in three different models or strategies that are thoroughly analyzed. Typical feature selection techniques are used over the implemented video descriptors as a pre-processing step in the classification of viewer perception, where several different classifiers have been considered as part of the experimental setup. Evaluation results show that the proposed video descriptors are clearly indicative of the subjective perception of viewers regardless of the implemented strategy and the number of classes considered. The strategy based on explicit opinion metadata clearly outperforms the implicit one in terms of classification accuracy. Finally, the combined approach slightly improves the explicit, achieving a top accuracy of 72.18\% when distinguishing between 2 classes, and suggesting that better classification results could be obtained by using suitable metrics to model perception derived from all available metadata.},
    }
  • [DOI] F. de-la-Calle-Silos, F. J. Valverde-Albacete, A. Gallardo-Antolín, and C. Peláez-Moreno, “Morphologically Filtered Power-Normalized Cochleograms as Robust, Biologically Inspired Features for ASR,” IEEE/ACM Transactions on Audio, Speech and Language Processing (TASLP), vol. 23, iss. 11, pp. 2070-2080, 2015.
    [Bibtex]
    @article{cal:val:gal:pel:15,
      author    = {de-la-Calle-Silos, Fernando and Valverde-Albacete, Francisco J. and Gallardo-Antol{\'i}n, Ascensi{\'o}n and Pel{\'a}ez-Moreno, Carmen},
      title     = {Morphologically Filtered Power-Normalized Cochleograms as Robust, Biologically Inspired Features for {ASR}},
      journal   = {{IEEE/ACM} Transactions on Audio, Speech and Language Processing {(TASLP)}},
      volume    = {23},
      number    = {11},
      pages     = {2070--2080},
      year      = {2015},
      issn      = {2329-9290},
      doi       = {10.1109/taslp.2015.2464691},
      unique-id = {WOS:000360835000031},
      key       = {samurai},
      type      = {Journal Article},
    }
  • [DOI] V. Buso, I. González-Díaz, and J. Benois-Pineau, “Goal-oriented top-down probabilistic visual attention model for recognition of manipulated objects in egocentric videos,” Signal Processing-Image Communication, vol. 39, pp. 418-431, 2015.
    [Bibtex]
    @article{RN410,
      author    = {Buso, Vincent and González-Díaz, Iván and Benois-Pineau, Jenny},
      title     = {Goal-oriented top-down probabilistic visual attention model for recognition of manipulated objects in egocentric videos},
      journal   = {Signal Processing: Image Communication},
      volume    = {39},
      pages     = {418--431},
      year      = {2015},
      issn      = {0923-5965},
      doi       = {10.1016/j.image.2015.05.006},
      unique-id = {WOS:000367412800009},
      type      = {Journal Article},
      key       = {samurai},
    }
  • [DOI] M. de-Frutos-Lopez, J. Luis González-de-Suso, S. Sanz-Rodriguez, C. Peláez-Moreno, and F. Díaz-de-María, “Two-level sliding-window VBR control algorithm for video on demand streaming,” Signal Processing-Image Communication, vol. 36, pp. 1-13, 2015.
    [Bibtex]
    @article{RN412,
      author    = {de-Frutos-López, Manuel and González-de-Suso, José Luis and Sanz-Rodríguez, Sergio and Peláez-Moreno, Carmen and Díaz-de-María, Fernando},
      title     = {Two-level sliding-window {VBR} control algorithm for video on demand streaming},
      journal   = {Signal Processing: Image Communication},
      volume    = {36},
      pages     = {1--13},
      year      = {2015},
      issn      = {0923-5965},
      doi       = {10.1016/j.image.2015.05.004},
      unique-id = {WOS:000360874700001},
      type      = {Journal Article},
      key       = {samurai},
    }
  • [DOI] I. González-Díaz, T. Martinez-Cortes, A. Gallardo-Antolin, and F. Díaz-de-María, “Temporal segmentation and keyframe selection methods for user-generated video search-based annotation,” Expert Systems with Applications, vol. 42, iss. 1, pp. 488-502, 2015.
    [Bibtex]
    @article{RN418,
      author    = {González-Díaz, Iván and Martínez-Cortés, Tomás and Gallardo-Antolín, Ascensión and Díaz-de-María, Fernando},
      title     = {Temporal segmentation and keyframe selection methods for user-generated video search-based annotation},
      journal   = {Expert Systems with Applications},
      volume    = {42},
      number    = {1},
      pages     = {488--502},
      year      = {2015},
      issn      = {0957-4174},
      doi       = {10.1016/j.eswa.2014.08.001},
      unique-id = {WOS:000344034300040},
      type      = {Journal Article},
    }
  • [DOI] J. Ludena-Choez and A. Gallardo-Antolin, “Feature extraction based on the high-pass filtering of audio signals for Acoustic Event Classification,” Computer Speech and Language, vol. 30, iss. 1, pp. 32-42, 2015.
    [Bibtex]
    @article{RN414,
      author    = {Ludeña-Choez, Jimmy and Gallardo-Antolín, Ascensión},
      title     = {Feature extraction based on the high-pass filtering of audio signals for Acoustic Event Classification},
      journal   = {Computer Speech and Language},
      volume    = {30},
      number    = {1},
      pages     = {32--42},
      year      = {2015},
      issn      = {0885-2308},
      doi       = {10.1016/j.csl.2014.04.001},
      unique-id = {WOS:000345556600004},
      type      = {Journal Article},
    }
  • [DOI] F. J. Valverde-Albacete and C. Peláez-Moreno, “The spectra of irreducible matrices over completed idempotent semifields,” Fuzzy Sets and Systems, vol. 271, pp. 46-69, 2015.
    [Bibtex]
    @article{RN413,
      author    = {Valverde-Albacete, Francisco J. and Peláez-Moreno, Carmen},
      title     = {The spectra of irreducible matrices over completed idempotent semifields},
      journal   = {Fuzzy Sets and Systems},
      volume    = {271},
      pages     = {46--69},
      year      = {2015},
      issn      = {0165-0114},
      doi       = {10.1016/j.fss.2014.09.022},
      unique-id = {WOS:000353216600005},
      type      = {Journal Article},
    }

2014

  • [DOI] A. Jiménez-Moreno, E. Martínez-Enríquez, V. Kumar, and F. Díaz-de-María, “Standard-Compliant Low-Pass Temporal Filter to Reduce the Perceived Flicker Artifact,” IEEE Transactions on Multimedia, vol. 16, iss. 7, pp. 1863-1873, 2014.
    [Bibtex]
    @article{Jimenez-Moreno2014,
      author   = {Jiménez-Moreno, A. and Martínez-Enríquez, E. and Kumar, V. and Díaz-de-María, F.},
      title    = {Standard-Compliant Low-Pass Temporal Filter to Reduce the Perceived Flicker Artifact},
      journal  = {IEEE Transactions on Multimedia},
      volume   = {16},
      number   = {7},
      pages    = {1863--1873},
      year     = {2014},
      month    = nov,
      issn     = {1520-9210},
      doi      = {10.1109/TMM.2014.2347257},
      keywords = {data compression;filtering theory;image motion analysis;social networking (online);video coding;standard-compliant low-pass temporal filter;perceived Flicker artifact reduction method;video-compression-related temporal artifact;luminance changes;block-by-block basis;video coding standards;bitstream generation;PSNR loss;H.264-AVC reference software;coding efficiency;motion-guided temporal filtering;Standards;Encoding;PSNR;Measurement;Video coding;Quantization (signal);Decoding;Flicker artifact;flicker reduction;H.264/AVC;low-pass temporal filtering;motion-guided temporal filtering;on-the-fly filter strength control;standard compliant},
    }
  • [DOI] J. L. González-de-Suso, A. Jiménez-Moreno, E. Martínez-Enríquez, and F. Díaz-de-María, “Improved Method to Select the Lagrange Multiplier for Rate-Distortion Based Motion Estimation in Video Coding,” IEEE Transactions on Circuits and Systems for Video Technology, vol. 24, iss. 3, pp. 452-464, 2014.
    [Bibtex]
    @article{Gonzalez-de-Suso2014,
      author   = {González-de-Suso, J. L. and Jiménez-Moreno, A. and Martínez-Enríquez, E. and Díaz-de-María, F.},
      title    = {Improved Method to Select the {Lagrange} Multiplier for Rate-Distortion Based Motion Estimation in Video Coding},
      journal  = {IEEE Transactions on Circuits and Systems for Video Technology},
      volume   = {24},
      number   = {3},
      pages    = {452--464},
      year     = {2014},
      month    = mar,
      issn     = {1051-8215},
      doi      = {10.1109/TCSVT.2013.2276857},
      keywords = {image segmentation;motion estimation;video coding;rate distortion;motion estimation;video coding;ME process;H.264/AVC reference software;Lagrangian parameter;ME errors;video segmentation;coding quality;context adaptive Lagrange multiplier;Encoding;Estimation;Video coding;Optimization;Software;Motion segmentation;Standards;H264/Advanced Video Coding (AVC);Lagrange multiplier;motion estimation;rate-distortion optimization;video coding},
    }
  • [DOI] I. González-Díaz, C. E. Baz-Hormigos, and F. Díaz-de-María, “A Generative Model for Concurrent Image Retrieval and ROI Segmentation,” IEEE Transactions on Multimedia, vol. 16, iss. 1, pp. 169-183, 2014.
    [Bibtex]
    @article{Gonzalez-Diaz2014,
      author   = {González-Díaz, Iván and Baz-Hormigos, C. E. and Díaz-de-María, F.},
      title    = {A Generative Model for Concurrent Image Retrieval and {ROI} Segmentation},
      journal  = {IEEE Transactions on Multimedia},
      volume   = {16},
      number   = {1},
      pages    = {169--183},
      year     = {2014},
      month    = jan,
      issn     = {1520-9210},
      doi      = {10.1109/TMM.2013.2286083},
      keywords = {image matching;image retrieval;image segmentation;object detection;probability;probabilistic generative model;concurrent image retrieval;ROI segmentation;region-of-interest segmentation;image matching process;geometric transformation;region of interest spatial location;visual similarity;query image;geometrically constrained matching;image segmentation;object detection;multiobject image retrieval tasks;multiview image retrieval;Computational modeling;Image segmentation;Image retrieval;Visualization;Vocabulary;Probabilistic logic;Quantization (signal);Image retrieval;Object segmentation;Object recognition;Image Databases;Computer Vision},
    }
  • [DOI] I. González-Díaz, C. E. Baz-Hormigos, and F. Díaz-de-María, “A Generative Model for Concurrent Image Retrieval and ROI Segmentation,” Ieee Transactions on Multimedia, vol. 16, iss. 1, pp. 169-183, 2014.
    [Bibtex]
    @article{RN422,
      author    = {González-Díaz, Iván and Baz-Hormigos, Carlos E. and Díaz-de-María, Fernando},
      title     = {A Generative Model for Concurrent Image Retrieval and {ROI} Segmentation},
      journal   = {{IEEE} Transactions on Multimedia},
      volume    = {16},
      number    = {1},
      pages     = {169--183},
      year      = {2014},
      issn      = {1520-9210},
      doi       = {10.1109/tmm.2013.2286083},
      unique-id = {WOS:000328948100015},
      type      = {Journal Article},
    }
  • [DOI] F. J. Valverde-Albacete and C. Peláez-Moreno, “100% Classification Accuracy Considered Harmful: The Normalized Information Transfer Factor Explains the Accuracy Paradox,” Plos One, vol. 9, iss. 1, 2014.
    [Bibtex]
    @article{RN419,
      author    = {Valverde-Albacete, Francisco J. and Peláez-Moreno, Carmen},
      title     = {100\% Classification Accuracy Considered Harmful: The Normalized Information Transfer Factor Explains the Accuracy Paradox},
      journal   = {{PLoS} {ONE}},
      volume    = {9},
      number    = {1},
      year      = {2014},
      issn      = {1932-6203},
      doi       = {10.1371/journal.pone.0084217},
      unique-id = {WOS:000329868200022},
      type      = {Journal Article},
    }

2013

  • [DOI] I. González-Díaz and F. Díaz-de-María, “A region-centered topic model for object discovery and category-based image segmentation,” Pattern Recognition, vol. 46, iss. 9, pp. 2437-2449, 2013.
    [Bibtex]
    @article{GONZALEZDIAZ20132437,
      author   = {González-Díaz, Iván and Díaz-de-María, Fernando},
      title    = {A region-centered topic model for object discovery and category-based image segmentation},
      journal  = {Pattern Recognition},
      volume   = {46},
      number   = {9},
      pages    = {2437--2449},
      year     = {2013},
      issn     = {0031-3203},
      doi      = {10.1016/j.patcog.2013.01.034},
      url      = {http://www.sciencedirect.com/science/article/pii/S0031320313000733},
      keywords = {Latent topic models, Topic discovery, Category-based image segmentation, Kernel Logistic Regression, Context},
      abstract = {Latent topic models have become a popular paradigm in many computer vision applications due to their capability to unsupervisely discover semantics in visual content. Relying on the Bag-of-Words representation, they consider images as mixtures of latent topics that generate visual words according to some specific distributions. However, the performance of these methods is still limited by the way in which they take into account the spatial distribution of visual words and, what is even more important, the currently used appearance distributions. In this paper, we propose a novel region-centered latent topic model that introduces two main contributions: first, an improved spatial context model that allows for considering inter-topic inter-region influences; and second, an advanced region-based appearance distribution built on the Kernel Logistic Regressor. It is worth highlighting that the proposed contributions have been seamlessly integrated in the model, so that all the parameters are concurrently estimated using a unified inference process. Furthermore, the proposed model has been extended to work in both unsupervised and supervised modes. Our results for unsupervised mode improve 30\% those of previous latent topic models. For supervised mode, where discriminative approaches are preponderant, our results are quite close to those of discriminative state-of-the-art methods.},
    }
  • [DOI] A. Jiménez-Moreno, E. Martínez-Enríquez, and F. Díaz-de-María, “Mode Decision-Based Algorithm for Complexity Control in H.264/AVC,” IEEE Transactions on Multimedia, vol. 15, iss. 5, pp. 1094-1109, 2013.
    [Bibtex]
    @article{Jimenez-Moreno2013,
      author   = {Jiménez-Moreno, A. and Martínez-Enríquez, E. and Díaz-de-María, F.},
      title    = {Mode Decision-Based Algorithm for Complexity Control in {H.264/AVC}},
      journal  = {IEEE Transactions on Multimedia},
      volume   = {15},
      number   = {5},
      pages    = {1094--1109},
      year     = {2013},
      month    = aug,
      issn     = {1520-9210},
      doi      = {10.1109/TMM.2013.2241414},
      keywords = {computational complexity;Gaussian processes;video coding;mode decision-based algorithm;complexity control;H.264-AVC video coding standard;computational complexity;complexity constraints;complexity control method;time-variant content;target complexities;binary hypothesis testing;high-complexity coding model;Gaussian statistics;probability density functions;decision threshold;JM10.2;coding efficiency;Complexity theory;Video coding;Encoding;Cost function;Standards;Signal processing algorithms;Testing;Complexity control;H.264/AVC;hypothesis testing;mode decision},
    }
  • [DOI] A. Gallardo-Antolín, A. I. García-Moral, Y. Pereiro-Estevan, and F. Díaz-de-María, “Design of an embedded speech-centric interface for applications in handheld terminals,” IEEE Aerospace and Electronic Systems Magazine, vol. 28, iss. 2, pp. 24-33, 2013.
    [Bibtex]
    @article{Gallardo-Antolin2013,
      author   = {Gallardo-Antolín, A. and García-Moral, A. I. and Pereiro-Estevan, Y. and Díaz-de-María, F.},
      title    = {Design of an embedded speech-centric interface for applications in handheld terminals},
      journal  = {IEEE Aerospace and Electronic Systems Magazine},
      volume   = {28},
      number   = {2},
      pages    = {24--33},
      year     = {2013},
      month    = feb,
      issn     = {0885-8985},
      doi      = {10.1109/MAES.2013.6477866},
      keywords = {cellular radio;embedded systems;minimisation;mobile computing;notebook computers;principal component analysis;speech recognition;speech-based user interfaces;stock markets;user interface management systems;embedded speech-centric interface design;handheld terminal applications;handheld wireless device;PDA;real-time stock price access;GPRS;ASR subsystem optimisation;handheld computational resource usage minimisation;fixed-point implementation;PCA;feature vector dimensionality reduction;Servers;Speech;Speech recognition;Mobile handsets;Real-time systems;Personal digital assistants;Ground penetrating radar},
    }
  • [DOI] J. Cadore, F. J. Valverde-Albacete, A. Gallardo-Antolin, and C. Peláez-Moreno, “Auditory-Inspired Morphological Processing of Speech Spectrograms: Applications in Automatic Speech Recognition and Speech Enhancement,” Cognitive Computation, vol. 5, iss. 4, pp. 426-441, 2013.
    [Bibtex]
    @article{RN424,
      author    = {Cadore, Joyner and Valverde-Albacete, Francisco J. and Gallardo-Antolín, Ascensión and Peláez-Moreno, Carmen},
      title     = {Auditory-Inspired Morphological Processing of Speech Spectrograms: Applications in Automatic Speech Recognition and Speech Enhancement},
      journal   = {Cognitive Computation},
      volume    = {5},
      number    = {4},
      pages     = {426--441},
      year      = {2013},
      issn      = {1866-9956},
      doi       = {10.1007/s12559-012-9196-6},
      unique-id = {WOS:000328221100003},
      type      = {Journal Article},
    }
  • [DOI] A. Gallardo-Antolin, A. I. Garcia-Moral, Y. Pereiro-Estevan, and F. Díaz-de-María, “Design of an Embedded Speech-Centric Interface for Applications in Handheld Terminals,” Ieee Aerospace and Electronic Systems Magazine, vol. 28, iss. 2, pp. 24-33, 2013.
    [Bibtex]
    @article{RN427,
      author    = {Gallardo-Antolín, Ascensión and García-Moral, Ana I. and Pereiro-Estevan, Yago and Díaz-de-María, Fernando},
      title     = {Design of an Embedded Speech-Centric Interface for Applications in Handheld Terminals},
      journal   = {{IEEE} Aerospace and Electronic Systems Magazine},
      volume    = {28},
      number    = {2},
      pages     = {24--33},
      year      = {2013},
      issn      = {0885-8985},
      doi       = {10.1109/maes.2013.6477866},
      unique-id = {WOS:000318545800004},
      type      = {Journal Article},
    }
  • [DOI] I. González-Díaz and F. Díaz-de-María, “A region-centered topic model for object discovery and category-based image segmentation,” Pattern Recognition, vol. 46, iss. 9, pp. 2437-2449, 2013.
    [Bibtex]
    @article{RN425,
      author    = {González-Díaz, Iván and Díaz-de-María, Fernando},
      title     = {A region-centered topic model for object discovery and category-based image segmentation},
      journal   = {Pattern Recognition},
      volume    = {46},
      number    = {9},
      pages     = {2437--2449},
      year      = {2013},
      issn      = {0031-3203},
      doi       = {10.1016/j.patcog.2013.01.034},
      unique-id = {WOS:000318837400004},
      type      = {Journal Article},
    }
  • [DOI] A. Jimenez-Moreno, E. Martinez-Enriquez, and F. Díaz-de-María, “Mode Decision-Based Algorithm for Complexity Control in H.264/AVC,” Ieee Transactions on Multimedia, vol. 15, iss. 5, pp. 1094-1109, 2013.
    [Bibtex]
    @article{RN426,
      author    = {Jiménez-Moreno, Amaya and Martínez-Enríquez, Eduardo and Díaz-de-María, Fernando},
      title     = {Mode Decision-Based Algorithm for Complexity Control in {H.264/AVC}},
      journal   = {{IEEE} Transactions on Multimedia},
      volume    = {15},
      number    = {5},
      pages     = {1094--1109},
      year      = {2013},
      issn      = {1520-9210},
      doi       = {10.1109/tmm.2013.2241414},
      unique-id = {WOS:000324763600013},
      type      = {Journal Article},
    }

2012

  • [DOI] S. Sanz-Rodríguez and F. Díaz-de-María, “In-Layer Multibuffer Framework for Rate-Controlled Scalable Video Coding,” IEEE Transactions on Circuits and Systems for Video Technology, vol. 22, iss. 8, pp. 1199-1212, 2012.
    [Bibtex]
    @article{Sanz-Rodriguez2012,
      author   = {Sanz-Rodríguez, S. and Díaz-de-María, F.},
      title    = {In-Layer Multibuffer Framework for Rate-Controlled Scalable Video Coding},
      journal  = {IEEE Transactions on Circuits and Systems for Video Technology},
      volume   = {22},
      number   = {8},
      pages    = {1199--1212},
      year     = {2012},
      month    = aug,
      issn     = {1051-8215},
      doi      = {10.1109/TCSVT.2012.2198089},
      keywords = {decoding;image reconstruction;image resolution;minimisation;video coding;in-layer multibuffer framework;rate-controlled scalable video coding;temporal scalability;hierarchical prediction structures;frame rate reduction;rate control algorithms;hypothetical reference decoder;frame rate substream;dependence layer;HRD-compliant temporal resolutions;rate-controlled SVC;virtual buffers;underflow prevention;overflow prevention;reconstructed video distortion minimization;H.264/SVC RC algorithm;variable bit rate applications;quality consistency;buffer control;advanced video coding;Static VAr compensators;Streaming media;Bit rate;Encoding;Gold;Scalability;Video coding;H.264/advanced video coding (AVC);H.264/SVC;hypothetical reference decoder (HRD);rate control (RC);scalable video coding (SVC);variable bit rate (VBR)}
    }
  • [DOI] R. Solera-Urena, A. I. Garcia-Moral, C. Pelaez-Moreno, M. Martinez-Ramon, and F. Diaz-de-Maria, “Real-Time Robust Automatic Speech Recognition Using Compact Support Vector Machines,” IEEE Transactions on Audio, Speech, and Language Processing, vol. 20, iss. 4, pp. 1347-1361, 2012.
    [Bibtex]
    @article{Solera-Urena2012,
      author   = {Solera-Urena, R. and Garcia-Moral, A. I. and Pelaez-Moreno, C. and Martinez-Ramon, M. and Diaz-de-Maria, F.},
      title    = {Real-Time Robust Automatic Speech Recognition Using Compact Support Vector Machines},
      journal  = {IEEE Transactions on Audio, Speech, and Language Processing},
      volume   = {20},
      number   = {4},
      pages    = {1347--1361},
      year     = {2012},
      month    = may,
      issn     = {1558-7916},
      doi      = {10.1109/TASL.2011.2178597},
      keywords = {neural nets;speech coding;speech recognition;support vector machines;real-time robust automatic speech recognition;support vector machines;artificial neural networks;speech processing community;weighted least squares training procedure;real-time speech decoding;connected-digit recognition task;SpeechDat Spanish database;Hidden Markov models;Support vector machines;Training;Speech recognition;Speech;Artificial neural networks;Real-time systems;Additive noise;artificial neural network (ANN)/hidden Markov model (HMM);compact support vector machine (SVM);hybrid automatic speech recognition (ASR);machine learning;real-time ASR;robust ASR;SVM/HMM}
    }
  • [DOI] S. Sanz-Rodriguez and F. Díaz-de-María, “In-Layer Multibuffer Framework for Rate-Controlled Scalable Video Coding,” IEEE Transactions on Circuits and Systems for Video Technology, vol. 22, iss. 8, pp. 1199-1212, 2012.
    [Bibtex]
    @article{RN431,
      author    = {Sanz-Rodriguez, Sergio and Díaz-de-María, Fernando},
      title     = {In-Layer Multibuffer Framework for Rate-Controlled Scalable Video Coding},
      journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
      volume    = {22},
      number    = {8},
      pages     = {1199--1212},
      year      = {2012},
      issn      = {1051-8215},
      doi       = {10.1109/tcsvt.2012.2198089},
      unique-id = {WOS:000308437500008},
      type      = {Journal Article}
    }
  • [DOI] R. Solera-Urena, A. I. Garcia-Moral, C. Peláez-Moreno, M. Martinez-Ramon, and F. Díaz-de-María, “Real-Time Robust Automatic Speech Recognition Using Compact Support Vector Machines,” IEEE Transactions on Audio, Speech, and Language Processing, vol. 20, iss. 4, pp. 1347-1361, 2012.
    [Bibtex]
    @article{RN432,
      author    = {Solera-Urena, Ruben and Garcia-Moral, Ana Isabel and Peláez-Moreno, Carmen and Martinez-Ramon, Manel and Díaz-de-María, Fernando},
      title     = {Real-Time Robust Automatic Speech Recognition Using Compact Support Vector Machines},
      journal   = {IEEE Transactions on Audio, Speech, and Language Processing},
      volume    = {20},
      number    = {4},
      pages     = {1347--1361},
      year      = {2012},
      issn      = {1558-7916},
      doi       = {10.1109/tasl.2011.2178597},
      unique-id = {WOS:000300846100009},
      type      = {Journal Article}
    }

2011

  • [DOI] E. Martinez-Enriquez, A. Jimenez-Moreno, M. Angel-Pellon, and F. Diaz-de-Maria, “A Two-Level Classification-Based Approach to Inter Mode Decision in H.264/AVC,” IEEE Transactions on Circuits and Systems for Video Technology, vol. 21, iss. 11, pp. 1719-1732, 2011.
    [Bibtex]
    @article{Martinez-Enriquez2011,
      author   = {Martinez-Enriquez, E. and Jimenez-Moreno, A. and Angel-Pellon, M. and Diaz-de-Maria, F.},
      title    = {A Two-Level Classification-Based Approach to Inter Mode Decision in {H.264/AVC}},
      journal  = {IEEE Transactions on Circuits and Systems for Video Technology},
      volume   = {21},
      number   = {11},
      pages    = {1719--1732},
      year     = {2011},
      month    = nov,
      issn     = {1051-8215},
      doi      = {10.1109/TCSVT.2011.2134010},
      keywords = {computational complexity;video coding;inter mode decision;H.264/AVC standard;SKIP/direct modes;two-level classification-based approach;classifier training process;state-of-the-art fast mode decision methods;complexity reduction;video coding standard;Complexity theory;Encoding;Current measurement;Cost function;Computational efficiency;Transforms;Indexes;H.264/AVC;inter mode decision;low complexity;rate-distortion optimization}
    }
  • [DOI] S. Sanz-Rodriguez and F. Diaz-de-Maria, “RBF-Based QP Estimation Model for VBR Control in H.264/SVC,” IEEE Transactions on Circuits and Systems for Video Technology, vol. 21, iss. 9, pp. 1263-1277, 2011.
    [Bibtex]
    @article{Sanz-Rodriguez2011,
      author   = {Sanz-Rodriguez, S. and Diaz-de-Maria, F.},
      title    = {{RBF}-Based {QP} Estimation Model for {VBR} Control in {H.264/SVC}},
      journal  = {IEEE Transactions on Circuits and Systems for Video Technology},
      volume   = {21},
      number   = {9},
      pages    = {1263--1277},
      year     = {2011},
      month    = sep,
      issn     = {1051-8215},
      doi      = {10.1109/TCSVT.2011.2143330},
      keywords = {data compression;image resolution;IPTV;radial basis function networks;television broadcasting;variable rate codes;video coding;H.264-SVC application;H.264-scalable video coding application;RBF-based QP estimation model;VBR controller;variable bit rate controller;quantization parameter value;radial basis function network;RBF network;mobile live streaming;Internet protocol television broadcast;QP encoding;constant bit rate controller;CBR controller;spatio-temporal resolution;Encoding;Static VAr compensators;Bit rate;Gold;Estimation;Complexity theory;Streaming media;H.264/advanced video coding (AVC);H.264/SVC;IPTV;rate control;scalable video coding (SVC);streaming;variable bit rate (VBR)}
    }
  • [DOI] D. Munoz-Mejias, I. Gonzalez-Diaz, and F. Diaz-de-Maria, “A low-complexity pre-processing system for restoring low-quality QR code images,” IEEE Transactions on Consumer Electronics, vol. 57, iss. 3, pp. 1320-1328, 2011.
    [Bibtex]
    @article{Munoz-Mejias2011,
      author   = {Munoz-Mejias, D. and Gonzalez-Diaz, I. and Diaz-de-Maria, F.},
      title    = {A low-complexity pre-processing system for restoring low-quality {QR} code images},
      journal  = {IEEE Transactions on Consumer Electronics},
      volume   = {57},
      number   = {3},
      pages    = {1320--1328},
      year     = {2011},
      month    = aug,
      issn     = {0098-3063},
      doi      = {10.1109/TCE.2011.6018890},
      keywords = {decoding;display devices;image coding;image restoration;mobile handsets;low-complexity preprocessing system;low-quality QR code image restoration;low-quality quick response code image restoration;code image decoding;cell phone display device;low contrast code image;blurred code image;rotated code image;deformed code image;intrinsic quick response code characteristic;realistic database assessment;Cellular phones;Cameras;Image restoration;Indexes;Algorithm design and analysis;Filtering algorithms;Image edge detection;QR codes;low complexity;bi-tonal image deblurring;blind image deconvolution;cell phone}
    }
  • [DOI] D. García-García, E. Parrado-Hernández, and F. Díaz-de-María, “State-space dynamics distance for clustering sequential data,” Pattern Recognition, vol. 44, iss. 5, pp. 1014-1022, 2011.
    [Bibtex]
    @article{GARCIAGARCIA20111014,
      author   = {García-García, Darío and Parrado-Hernández, Emilio and Díaz-de-María, Fernando},
      title    = {State-space dynamics distance for clustering sequential data},
      journal  = {Pattern Recognition},
      volume   = {44},
      number   = {5},
      pages    = {1014--1022},
      year     = {2011},
      issn     = {0031-3203},
      doi      = {10.1016/j.patcog.2010.11.018},
      url      = {http://www.sciencedirect.com/science/article/pii/S0031320310005455},
      keywords = {Sequential data, Clustering, Hidden Markov models},
      abstract = {This paper proposes a novel similarity measure for clustering sequential data. We first construct a common state space by training a single probabilistic model with all the sequences in order to get a unified representation for the dataset. Then, distances are obtained attending to the transition matrices induced by each sequence in that state space. This approach solves some of the usual overfitting and scalability issues of the existing semi-parametric techniques that rely on training a model for each sequence. Empirical studies on both synthetic and real-world datasets illustrate the advantages of the proposed similarity measure for clustering sequences.}
    }
  • [DOI] A. I. Garcia-Moral, R. Solera-Urena, C. Pelaez-Moreno, and F. Diaz-de-Maria, “Data Balancing for Efficient Training of Hybrid ANN/HMM Automatic Speech Recognition Systems,” IEEE Transactions on Audio, Speech, and Language Processing, vol. 19, iss. 3, pp. 468-481, 2011.
    [Bibtex]
    @article{Garcia-Moral2011,
      author   = {Garcia-Moral, A. I. and Solera-Urena, R. and Pelaez-Moreno, C. and Diaz-de-Maria, F.},
      title    = {Data Balancing for Efficient Training of Hybrid {ANN/HMM} Automatic Speech Recognition Systems},
      journal  = {IEEE Transactions on Audio, Speech, and Language Processing},
      volume   = {19},
      number   = {3},
      pages    = {468--481},
      year     = {2011},
      month    = mar,
      issn     = {1558-7916},
      doi      = {10.1109/TASL.2010.2050513},
      keywords = {hidden Markov models;learning (artificial intelligence);speech recognition;data balancing;hybrid ANN/HMM automatic speech recognition;hidden Markov models;Gaussian mixture models;artificial neural networks;training set;a posteriori probability;Hidden Markov models;Automatic speech recognition;Artificial neural networks;Speech recognition;State estimation;Databases;Noise reduction;Working environment noise;Testing;Training data;Active learning;additive noise;ANN/HMM;artificial neural networks (ANNs);hidden Markov models (HMMs);hybrid automatic speech recognition (ASR);machine learning;MLP/HMM;multilayer perceptrons (MLPs);robust ASR}
    }
  • [DOI] D. Garcia-Garcia, E. Parrado-Hernandez, and F. Díaz-de-María, “State-space dynamics distance for clustering sequential data,” Pattern Recognition, vol. 44, iss. 5, pp. 1014-1022, 2011.
    [Bibtex]
    @article{RN441,
      author    = {Garcia-Garcia, Dario and Parrado-Hernandez, Emilio and Díaz-de-María, Fernando},
      title     = {State-space dynamics distance for clustering sequential data},
      journal   = {Pattern Recognition},
      volume    = {44},
      number    = {5},
      pages     = {1014--1022},
      year      = {2011},
      issn      = {0031-3203},
      doi       = {10.1016/j.patcog.2010.11.018},
      unique-id = {WOS:000287467300002},
      type      = {Journal Article}
    }
  • [DOI] A. I. Garcia-Moral, R. Solera-Urena, C. Peláez-Moreno, and F. Díaz-de-María, “Data Balancing for Efficient Training of Hybrid ANN/HMM Automatic Speech Recognition Systems,” IEEE Transactions on Audio, Speech, and Language Processing, vol. 19, iss. 3, pp. 468-481, 2011.
    [Bibtex]
    @article{RN442,
      author    = {Garcia-Moral, Ana Isabel and Solera-Urena, Ruben and Peláez-Moreno, Carmen and Díaz-de-María, Fernando},
      title     = {Data Balancing for Efficient Training of Hybrid {ANN/HMM} Automatic Speech Recognition Systems},
      journal   = {IEEE Transactions on Audio, Speech, and Language Processing},
      volume    = {19},
      number    = {3},
      pages     = {468--481},
      year      = {2011},
      issn      = {1558-7916},
      doi       = {10.1109/tasl.2010.2050513},
      unique-id = {WOS:000291717800003},
      type      = {Journal Article}
    }
  • [DOI] E. Martinez-Enriquez, A. Jimenez-Moreno, M. Angel-Pellon, and F. Díaz-de-María, “A Two-Level Classification-Based Approach to Inter Mode Decision in H.264/AVC,” IEEE Transactions on Circuits and Systems for Video Technology, vol. 21, iss. 11, pp. 1719-1732, 2011.
    [Bibtex]
    @article{RN437,
      author    = {Martinez-Enriquez, Eduardo and Jimenez-Moreno, Amaya and Angel-Pellon, Miguel and Díaz-de-María, Fernando},
      title     = {A Two-Level Classification-Based Approach to Inter Mode Decision in {H.264/AVC}},
      journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
      volume    = {21},
      number    = {11},
      pages     = {1719--1732},
      year      = {2011},
      issn      = {1051-8215},
      doi       = {10.1109/tcsvt.2011.2134010},
      unique-id = {WOS:000296471100015},
      type      = {Journal Article}
    }
  • [DOI] D. Munoz-Mejias, I. González-Díaz, and F. Díaz-de-María, “A Low-Complexity Pre-Processing System for Restoring Low-Quality QR Code Images,” IEEE Transactions on Consumer Electronics, vol. 57, iss. 3, pp. 1320-1328, 2011.
    [Bibtex]
    @article{RN439,
      author    = {Munoz-Mejias, David and González-Díaz, Ivan and Díaz-de-María, Fernando},
      title     = {A Low-Complexity Pre-Processing System for Restoring Low-Quality {QR} Code Images},
      journal   = {IEEE Transactions on Consumer Electronics},
      volume    = {57},
      number    = {3},
      pages     = {1320--1328},
      year      = {2011},
      issn      = {0098-3063},
      doi       = {10.1109/tce.2011.6018890},
      unique-id = {WOS:000298730900046},
      type      = {Journal Article}
    }
  • [DOI] S. Sanz-Rodriguez and F. Díaz-de-María, “RBF-Based QP Estimation Model for VBR Control in H.264/SVC,” IEEE Transactions on Circuits and Systems for Video Technology, vol. 21, iss. 9, pp. 1263-1277, 2011.
    [Bibtex]
    @article{RN438,
      author    = {Sanz-Rodriguez, Sergio and Díaz-de-María, Fernando},
      title     = {{RBF}-Based {QP} Estimation Model for {VBR} Control in {H.264/SVC}},
      journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
      volume    = {21},
      number    = {9},
      pages     = {1263--1277},
      year      = {2011},
      issn      = {1051-8215},
      doi       = {10.1109/tcsvt.2011.2143330},
      unique-id = {WOS:000294669900008},
      type      = {Journal Article}
    }
  • [DOI] F. J. Valverde-Albacete and C. Peláez-Moreno, “Extending conceptualisation modes for generalised Formal Concept Analysis,” Information Sciences, vol. 181, iss. 10, pp. 1888-1909, 2011.
    [Bibtex]
    @article{RN440,
      author    = {Valverde-Albacete, Francisco J. and Peláez-Moreno, Carmen},
      title     = {Extending conceptualisation modes for generalised {Formal} {Concept} {Analysis}},
      journal   = {Information Sciences},
      volume    = {181},
      number    = {10},
      pages     = {1888--1909},
      year      = {2011},
      issn      = {0020-0255},
      doi       = {10.1016/j.ins.2010.04.014},
      unique-id = {WOS:000288833300009},
      type      = {Journal Article}
    }

2010

  • [DOI] M. de-Frutos-López, D. Orellana-Quirós, J. C. Pujol-Alcolado, and F. Díaz-de-María, “An improved fast mode decision algorithm for intraprediction in H.264/AVC video coding,” Signal Processing: Image Communication, vol. 25, iss. 10, pp. 709-716, 2010.
    [Bibtex]
    @article{DEFRUTOSLOPEZ2010709,
      author   = {de-Frutos-López, Manuel and Orellana-Quirós, Daniel and Pujol-Alcolado, José C. and Díaz-de-María, Fernando},
      title    = {An improved fast mode decision algorithm for intraprediction in {H.264/AVC} video coding},
      journal  = {Signal Processing: Image Communication},
      volume   = {25},
      number   = {10},
      pages    = {709--716},
      year     = {2010},
      issn     = {0923-5965},
      doi      = {10.1016/j.image.2010.10.005},
      url      = {http://www.sciencedirect.com/science/article/pii/S0923596510001128},
      keywords = {H.264/AVC, Intra, Mode decision, Fast intra mode decision},
      abstract = {In this article, an improved version of one of the most cited intra mode decision algorithms in H.264/AVC video coding is proposed with the aim to improve its efficiency and performance. The reference algorithm determines the interpolation/extrapolation spatial direction (mode) for achieving the best intra prediction using the Sobel gradient calculation. The proposed algorithm suggests reducing the number of gradients calculated and changing the Sobel operator to that of Roberts. In addition to this, it also proposes including the previously encoded neighboring block modes among the evaluated modes. Experimental results show that the proposed algorithm reduces the computational load of the original algorithm and substantially improves its rate-distortion performance.}
    }
  • [DOI] S. Sanz-Rodriguez, O. del-Ama-Esteban, M. de-Frutos-Lopez, and F. Diaz-de-Maria, “Cauchy-Density-Based Basic Unit Layer Rate Controller for H.264/AVC,” IEEE Transactions on Circuits and Systems for Video Technology, vol. 20, iss. 8, pp. 1139-1143, 2010.
    [Bibtex]
    @article{Sanz-Rodriguez2010,
      author   = {Sanz-Rodriguez, S. and del-Ama-Esteban, O. and de-Frutos-Lopez, M. and Diaz-de-Maria, F.},
      title    = {{Cauchy}-Density-Based Basic Unit Layer Rate Controller for {H.264/AVC}},
      journal  = {IEEE Transactions on Circuits and Systems for Video Technology},
      volume   = {20},
      number   = {8},
      pages    = {1139--1143},
      year     = {2010},
      month    = aug,
      issn     = {1051-8215},
      doi      = {10.1109/TCSVT.2010.2051369},
      keywords = {discrete cosine transforms;rate distortion theory;telecommunication control;video coding;basic unit layer rate controller;H.264/AVC;video coding standard;bit allocation;rate-distortion modeling;discrete cosine transform coefficient;picture quality;delay control;advanced video coding;Cauchy probability density function;rate control algorithm;Automatic voltage control;Video coding;Bit rate;Standards development;Rate-distortion;Discrete cosine transforms;Delay;Probability density function;PSNR;Fluctuations;Basic unit (BU);bit allocation;H264/advanced video coding (AVC);low-delay;rate control}
    }
  • [DOI] J. Vicente-Peña and F. Díaz-de-María, “Uncertainty decoding on Frequency Filtered parameters for robust ASR,” Speech Communication, vol. 52, iss. 5, pp. 440-449, 2010.
    [Bibtex]
    @article{VICENTEPENA2010440,
      author   = {Vicente-Peña, Jesús and Díaz-de-María, Fernando},
      title    = {Uncertainty decoding on {Frequency} {Filtered} parameters for robust {ASR}},
      journal  = {Speech Communication},
      volume   = {52},
      number   = {5},
      pages    = {440--449},
      year     = {2010},
      issn     = {0167-6393},
      doi      = {10.1016/j.specom.2010.02.002},
      url      = {http://www.sciencedirect.com/science/article/pii/S0167639310000166},
      keywords = {Robust speech recognition, Spectral subtraction, Uncertainty decoding, Frequency Filtered, Bounded distance HMM, SSBD-HMM},
      abstract = {The use of feature enhancement techniques to obtain estimates of the clean parameters is a common approach for robust automatic speech recognition (ASR). However, the decoding algorithm typically ignores how accurate these estimates are. Uncertainty decoding methods incorporate this type of information. In this paper, we develop a formulation of the uncertainty decoding paradigm for Frequency Filtered (FF) parameters using spectral subtraction as a feature enhancement method. Additionally, we show that the uncertainty decoding method for FF parameters admits a simple interpretation as a spectral weighting method that assigns more importance to the most reliable spectral components. Furthermore, we suggest combining this method with SSBD-HMM (Spectral Subtraction and Bounded Distance HMM), one recently proposed technique that is able to compensate for the effects of features that are highly contaminated (outliers). This combination pursues two objectives: to improve the results achieved by uncertainty decoding methods and to determine which part of the improvements is due to compensating for the effects of outliers and which part is due to compensating for other less deteriorated features.}
    }
  • [DOI] J. Vicente-Peña, F. Díaz-de-María, and W. B. Kleijn, “The synergy between bounded-distance HMM and spectral subtraction for robust speech recognition,” Speech Communication, vol. 52, iss. 2, pp. 123-133, 2010.
    [Bibtex]
    @article{VICENTEPENA2010123,
      author   = {Vicente-Peña, Jesús and Díaz-de-María, Fernando and Kleijn, W. Bastiaan},
      title    = {The synergy between bounded-distance {HMM} and spectral subtraction for robust speech recognition},
      journal  = {Speech Communication},
      volume   = {52},
      number   = {2},
      pages    = {123--133},
      year     = {2010},
      issn     = {0167-6393},
      doi      = {10.1016/j.specom.2009.09.002},
      url      = {http://www.sciencedirect.com/science/article/pii/S0167639309001459},
      keywords = {Robust speech recognition, Spectral subtraction, Acoustic backing-off, Bounded-distance HMM, Missing features, Outliers},
      abstract = {Additive noise generates important losses in automatic speech recognition systems. In this paper, we show that one of the causes contributing to these losses is the fact that conventional recognisers take into consideration feature values that are outliers. The method that we call bounded-distance HMM is a suitable method to avoid that outliers contribute to the recogniser decision. However, this method just deals with outliers, leaving the remaining features unaltered. In contrast, spectral subtraction is able to correct all the features at the expense of introducing some artifacts that, as shown in the paper, cause a larger number of outliers. As a result, we find that bounded-distance HMM and spectral subtraction complement each other well. A comprehensive experimental evaluation was conducted, considering several well-known ASR tasks (of different complexities) and numerous noise types and SNRs. The achieved results show that the suggested combination generally outperforms both the bounded-distance HMM and spectral subtraction individually. Furthermore, the obtained improvements, especially for low and medium SNRs, are larger than the sum of the improvements individually obtained by bounded-distance HMM and spectral subtraction.}
    }
  • [DOI] E. Martinez-Enriquez, A. Jimenez-Moreno, and F. Diaz-de-Maria, “An adaptive algorithm for fast inter mode decision in the H.264/AVC video coding standard,” IEEE Transactions on Consumer Electronics, vol. 56, iss. 2, pp. 826-834, 2010.
    [Bibtex]
    @article{Martinez-Enriquez2010,
      author   = {Martinez-Enriquez, E. and Jimenez-Moreno, A. and Diaz-de-Maria, F.},
      title    = {An adaptive algorithm for fast inter mode decision in the {H.264/AVC} video coding standard},
      journal  = {IEEE Transactions on Consumer Electronics},
      volume   = {56},
      number   = {2},
      pages    = {826--834},
      year     = {2010},
      month    = may,
      issn     = {0098-3063},
      doi      = {10.1109/TCE.2010.5506008},
      keywords = {motion estimation;standards;video coding;inter mode decision;H.264/AVC;video coding standard;motion estimation;macroblock mode decisions;adaptive mode decision method;Adaptive algorithm;Automatic voltage control;Video coding;Motion estimation;IEC standards;ISO standards;Streaming media;High definition video;Computational efficiency;Rate-distortion;H.264/AVC;rate-distortion optimization;fast inter mode decision;content adaptive;low-complexity}
    }
  • [DOI] M. de-Frutos-Lopez, D. Orellana-Quiros, J. C. Pujol-Alcolado, and F. Díaz-de-María, “An improved fast mode decision algorithm for intraprediction in H.264/AVC video coding,” Signal Processing: Image Communication, vol. 25, iss. 10, pp. 709-716, 2010.
    [Bibtex]
    @article{RN448,
      author    = {de-Frutos-Lopez, Manuel and Orellana-Quiros, Daniel and Pujol-Alcolado, José C. and Díaz-de-María, Fernando},
      title     = {An improved fast mode decision algorithm for intraprediction in {H.264/AVC} video coding},
      journal   = {Signal Processing: Image Communication},
      volume    = {25},
      number    = {10},
      pages     = {709--716},
      year      = {2010},
      issn      = {0923-5965},
      doi       = {10.1016/j.image.2010.10.005},
      unique-id = {WOS:000286031000001},
      type      = {Journal Article}
    }
  • [DOI] E. Martinez-Enriquez, A. Jimenez-Moreno, and F. Díaz-de-María, “An Adaptive Algorithm for Fast Inter Mode Decision in the H.264/AVC Video Coding Standard,” IEEE Transactions on Consumer Electronics, vol. 56, iss. 2, pp. 826-834, 2010.
    [Bibtex]
    @article{RN452,
      author    = {Martinez-Enriquez, Eduardo and Jimenez-Moreno, Amaya and Díaz-de-María, Fernando},
      title     = {An Adaptive Algorithm for Fast Inter Mode Decision in the {H.264/AVC} Video Coding Standard},
      journal   = {IEEE Transactions on Consumer Electronics},
      volume    = {56},
      number    = {2},
      pages     = {826--834},
      year      = {2010},
      issn      = {0098-3063},
      doi       = {10.1109/tce.2010.5506008},
      unique-id = {WOS:000281747600081},
      type      = {Journal Article}
    }
  • [DOI] M. Martinez-Ramon, A. Gallardo-Antolin, J. Cid-Sueiro, G. L. Heileman, K. Yung, W. Zheng, C. Zhao, and S. Posse, “Automatic Placement of Outer Volume Suppression Slices in MR Spectroscopic Imaging of the Human Brain,” Magnetic Resonance in Medicine, vol. 63, iss. 3, pp. 592-600, 2010.
    [Bibtex]
    @article{RN454,
      author    = {Martinez-Ramon, Manel and Gallardo-Antolin, Ascension and Cid-Sueiro, Jesus and Heileman, Gregory L. and Yung, Kaung-Ti and Zheng, Weili and Zhao, Chenguang and Posse, Stefan},
      title     = {Automatic Placement of Outer Volume Suppression Slices in {MR} Spectroscopic Imaging of the Human Brain},
      journal   = {Magnetic Resonance in Medicine},
      volume    = {63},
      number    = {3},
      pages     = {592--600},
      year      = {2010},
      issn      = {0740-3194},
      doi       = {10.1002/mrm.22275},
      unique-id = {WOS:000274938000007},
      type      = {Journal Article}
    }
  • [DOI] C. Peláez-Moreno, A. I. Garcia-Moral, and F. J. Valverde-Albacete, “Analyzing phonetic confusions using formal concept analysis,” Journal of the Acoustical Society of America, vol. 128, iss. 3, pp. 1377-1390, 2010.
    [Bibtex]
    @article{RN449,
      author    = {Peláez-Moreno, C. and Garcia-Moral, A. I. and Valverde-Albacete, F. J.},
      title     = {Analyzing phonetic confusions using formal concept analysis},
      journal   = {Journal of the Acoustical Society of America},
      volume    = {128},
      number    = {3},
      pages     = {1377--1390},
      year      = {2010},
      issn      = {0001-4966},
      doi       = {10.1121/1.3458854},
      unique-id = {WOS:000281799800048},
      type      = {Journal Article}
    }
  • [DOI] S. Sanz-Rodriguez, O. del-Ama-Esteban, M. de-Frutos-Lopez, and F. Díaz-de-María, “Cauchy-Density-Based Basic Unit Layer Rate Controller for H.264/AVC,” IEEE Transactions on Circuits and Systems for Video Technology, vol. 20, iss. 8, pp. 1139-1143, 2010.
    [Bibtex]
    @article{RN451,
      author    = {Sanz-Rodriguez, Sergio and del-Ama-Esteban, Oscar and de-Frutos-Lopez, Manuel and Díaz-de-María, Fernando},
      title     = {{Cauchy}-Density-Based Basic Unit Layer Rate Controller for {H.264/AVC}},
      journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
      volume    = {20},
      number    = {8},
      pages     = {1139--1143},
      year      = {2010},
      issn      = {1051-8215},
      doi       = {10.1109/tcsvt.2010.2051369},
      unique-id = {WOS:000282976200008},
      type      = {Journal Article}
    }
  • [DOI] F. J. Valverde-Albacete and C. Peláez-Moreno, “Two information-theoretic tools to assess the performance of multi-class classifiers,” Pattern Recognition Letters, vol. 31, iss. 12, pp. 1665-1671, 2010.
    [Bibtex]
    @article{RN450,
      author    = {Valverde-Albacete, Francisco J. and Peláez-Moreno, Carmen},
      title     = {Two information-theoretic tools to assess the performance of multi-class classifiers},
      journal   = {Pattern Recognition Letters},
      volume    = {31},
      number    = {12},
      pages     = {1665--1671},
      year      = {2010},
      issn      = {0167-8655},
      doi       = {10.1016/j.patrec.2010.05.017},
      unique-id = {WOS:000281368200022},
      type      = {Journal Article}
    }
  • [DOI] J. Vicente-Pena and F. Díaz-de-María, “Uncertainty decoding on Frequency Filtered parameters for robust ASR,” Speech Communication, vol. 52, iss. 5, pp. 440-449, 2010.
    [Bibtex]
    @article{RN453,
      author    = {Vicente-Pena, Jesus and Díaz-de-María, Fernando},
      title     = {Uncertainty decoding on {Frequency} {Filtered} parameters for robust {ASR}},
      journal   = {Speech Communication},
      volume    = {52},
      number    = {5},
      pages     = {440--449},
      year      = {2010},
      issn      = {0167-6393},
      doi       = {10.1016/j.specom.2010.02.002},
      unique-id = {WOS:000277544200006},
      type      = {Journal Article}
    }
  • [DOI] J. Vicente-Pena, F. Díaz-de-María, and W. B. Kleijn, “The synergy between bounded-distance HMM and spectral subtraction for robust speech recognition,” Speech Communication, vol. 52, iss. 2, pp. 123-133, 2010.
    [Bibtex]
    @article{RN455,
      author    = {Vicente-Pena, Jesus and Díaz-de-María, Fernando and Kleijn, W. Bastiaan},
      title     = {The synergy between bounded-distance {HMM} and spectral subtraction for robust speech recognition},
      journal   = {Speech Communication},
      volume    = {52},
      number    = {2},
      pages     = {123--133},
      year      = {2010},
      issn      = {0167-6393},
      doi       = {10.1016/j.specom.2009.09.002},
      unique-id = {WOS:000272764100004},
      type      = {Journal Article}
    }

2009

  • [DOI] P. Henriquez, J. B. Alonso, M. A. Ferrer, C. M. Travieso, J. I. Godino-Llorente, and F. Diaz-de-Maria, “Characterization of Healthy and Pathological Voice Through Measures Based on Nonlinear Dynamics,” IEEE Transactions on Audio, Speech, and Language Processing, vol. 17, iss. 6, pp. 1186-1195, 2009.
    [Bibtex]
    @article{Henriquez2009,
      author   = {Henriquez, P. and Alonso, J. B. and Ferrer, M. A. and Travieso, C. M. and Godino-Llorente, J. I. and Diaz-de-Maria, F.},
      title    = {Characterization of Healthy and Pathological Voice Through Measures Based on Nonlinear Dynamics},
      journal  = {IEEE Transactions on Audio, Speech, and Language Processing},
      volume   = {17},
      number   = {6},
      pages    = {1186--1195},
      year     = {2009},
      month    = aug,
      issn     = {1558-7916},
      doi      = {10.1109/TASL.2009.2016734},
      keywords = {chaos;entropy;neural nets;speech processing;pathological voice;nonlinear dynamic theory;voice recording;speech signal quality;voice production process;linear approximation;nonlinear chaotic measures;first-order Renyi entropy;second-order Renyi entropy;correlation entropy;correlation dimension;phase-space domain;mutual information function;Shannon entropy;commercial database;multiquality database;standard neural network-based classifier;healthy voice;Pathology;Databases;Entropy;Speech;Linear approximation;Chaos;Phase measurement;Mutual information;Measurement standards;Neural networks;Chaos;disordered speech;entropy;nonlinearity}
    }
  • [DOI] D. Garcia-Garcia, E. Parrado Hernandez, and F. Diaz-de-Maria, “A New Distance Measure for Model-Based Sequence Clustering,” IEEE Transactions on Pattern Analysis and Machine Intelligence, vol. 31, iss. 7, pp. 1325-1331, 2009.
    [Bibtex]
    @article{Garcia-Garcia2009,
      author   = {Garcia-Garcia, D. and Parrado Hernandez, E. and Diaz-de-Maria, F.},
      title    = {A New Distance Measure for Model-Based Sequence Clustering},
      journal  = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
      year     = {2009},
      month    = jul,
      volume   = {31},
      number   = {7},
      pages    = {1325--1331},
      keywords = {pattern clustering;model-based sequence clustering;Kullback-Leibler divergence;model-based distances;model selection scheme;Hidden Markov models;Machine learning;Machine learning algorithms;Learning systems;Computational complexity;Clustering algorithms;Clustering methods;Proposals;Character generation;Clustering;sequential data;similarity measures.;Similarity measures;sequence clustering;Algorithms;Artificial Intelligence;Cluster Analysis;Computer Simulation;Information Storage and Retrieval;Models, Statistical;Pattern Recognition, Automated;Reproducibility of Results;Sensitivity and Specificity;Sequence Analysis},
      doi      = {10.1109/TPAMI.2008.268},
      issn     = {0162-8828},
    }
  • [DOI] D. Garcia-Garcia, E. Parrado Hernandez, and F. Díaz-de-María, “A New Distance Measure for Model-Based Sequence Clustering,” IEEE Transactions on Pattern Analysis and Machine Intelligence, vol. 31, iss. 7, pp. 1325-1331, 2009.
    [Bibtex]
    @article{RN459,
      author    = {Garcia-Garcia, Dario and Parrado Hernandez, Emilio and Díaz-de-María, Fernando},
      title     = {A New Distance Measure for Model-Based Sequence Clustering},
      journal   = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
      volume    = {31},
      number    = {7},
      pages     = {1325--1331},
      year      = {2009},
      issn      = {0162-8828},
      doi       = {10.1109/tpami.2008.268},
      unique-id = {WOS:000266188900014},
      type      = {Journal Article},
    }
  • [DOI] P. Henriquez, J. B. Alonso, M. A. Ferrer, C. M. Travieso, J. I. Godino-Llorente, and F. Díaz-de-María, “Characterization of Healthy and Pathological Voice Through Measures Based on Nonlinear Dynamics,” IEEE Transactions on Audio, Speech, and Language Processing, vol. 17, iss. 6, pp. 1186-1195, 2009.
    [Bibtex]
    @article{RN458,
      author    = {Henriquez, Patricia and Alonso, Jesus B. and Ferrer, Miguel A. and Travieso, Carlos M. and Godino-Llorente, Juan I. and Díaz-de-María, Fernando},
      title     = {Characterization of Healthy and Pathological Voice Through Measures Based on Nonlinear Dynamics},
      journal   = {IEEE Transactions on Audio, Speech, and Language Processing},
      volume    = {17},
      number    = {6},
      pages     = {1186--1195},
      year      = {2009},
      issn      = {1558-7916},
      doi       = {10.1109/tasl.2009.2016734},
      unique-id = {WOS:000268039700011},
      type      = {Journal Article},
    }

2008

  • [DOI] I. Gonzalez-Diaz and F. Diaz-de-Maria, “Adaptive Multipattern Fast Block-Matching Algorithm Based on Motion Classification Techniques,” IEEE Transactions on Circuits and Systems for Video Technology, vol. 18, iss. 10, pp. 1369-1382, 2008.
    [Bibtex]
    @article{Gonzalez-Diaz2008,
      author   = {I. Gonzalez-Diaz and F. Diaz-de-Maria},
      title    = {Adaptive Multipattern Fast Block-Matching Algorithm Based on Motion Classification Techniques},
      journal  = {IEEE Transactions on Circuits and Systems for Video Technology},
      year     = {2008},
      month    = oct,
      volume   = {18},
      number   = {10},
      pages    = {1369--1382},
      keywords = {code standards;image classification;image sequences;motion estimation;video coding;adaptive multipattern fast block-matching algorithm;motion classification technique;video coding standard;motion estimation;video sequence;Video sequences;Video coding;Motion estimation;Adaptive algorithm;Robustness;MPEG 4 Standard;Dispersion;Motion detection;Computational efficiency;Costs;Binary linear classifier;block-matching;motion classification;motion estimation;multipattern algorithms},
      doi      = {10.1109/TCSVT.2008.2004917},
      issn     = {1051-8215},
    }
  • [DOI] I. González-Díaz and F. Díaz-de-María, “Adaptive Multipattern Fast Block-Matching Algorithm Based on Motion Classification Techniques,” IEEE Transactions on Circuits and Systems for Video Technology, vol. 18, iss. 10, pp. 1369-1382, 2008.
    [Bibtex]
    @article{RN466,
      author    = {González-Díaz, Iván and Díaz-de-María, Fernando},
      title     = {Adaptive Multipattern Fast Block-Matching Algorithm Based on Motion Classification Techniques},
      journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
      volume    = {18},
      number    = {10},
      pages     = {1369--1382},
      year      = {2008},
      issn      = {1051-8215},
      doi       = {10.1109/tcsvt.2008.2004917},
      unique-id = {WOS:000260866800005},
      type      = {Journal Article},
    }
  • [DOI] J. M. Leiva-Murillo, S. Salcedo-Sanz, A. Gallardo-Antolin, and A. Artes-Rodriguez, “A simulated annealing approach to speaker segmentation in audio databases,” Engineering Applications of Artificial Intelligence, vol. 21, iss. 4, pp. 499-508, 2008.
    [Bibtex]
    @article{RN467,
      author    = {Leiva-Murillo, José M. and Salcedo-Sanz, Sancho and Gallardo-Antolín, Ascensión and Artes-Rodriguez, Antonio},
      title     = {A simulated annealing approach to speaker segmentation in audio databases},
      journal   = {Engineering Applications of Artificial Intelligence},
      volume    = {21},
      number    = {4},
      pages     = {499--508},
      year      = {2008},
      issn      = {0952-1976},
      doi       = {10.1016/j.engappai.2007.07.002},
      unique-id = {WOS:000257010700001},
      type      = {Journal Article},
    }
  • [DOI] F. J. Valverde-Albacete, “Extracting frame-semantics knowledge using lattice theory,” Journal of Logic and Computation, vol. 18, iss. 3, pp. 361-384, 2008.
    [Bibtex]
    @article{RN468,
      author    = {Valverde-Albacete, Francisco J.},
      title     = {Extracting frame-semantics knowledge using lattice theory},
      journal   = {Journal of Logic and Computation},
      volume    = {18},
      number    = {3},
      pages     = {361--384},
      year      = {2008},
      issn      = {0955-792X},
      doi       = {10.1093/logcom/exm069},
      unique-id = {WOS:000256173100004},
      type      = {Journal Article},
    }

2007

  • [DOI] R. Solera-Ureña, D. Martín-Iglesias, A. Gallardo-Antolín, C. Peláez-Moreno, and F. Díaz-de-María, “Robust ASR using Support Vector Machines,” Speech Communication, vol. 49, iss. 4, pp. 253-267, 2007.
    [Bibtex]
    @article{SOLERAURENA2007253,
      author   = {R. Solera-Ureña and D. Martín-Iglesias and A. Gallardo-Antolín and C. Peláez-Moreno and F. Díaz-de-María},
      title    = {Robust {ASR} using Support Vector Machines},
      journal  = {Speech Communication},
      volume   = {49},
      number   = {4},
      pages    = {253--267},
      year     = {2007},
      issn     = {0167-6393},
      doi      = {10.1016/j.specom.2007.01.013},
      url      = {http://www.sciencedirect.com/science/article/pii/S0167639307000246},
      keywords = {Robust ASR, Additive noise, Machine learning, Support Vector Machines, Kernel methods, HMM, ANN, Hybrid ASR, Dynamic Time Alignment},
      abstract = {The improved theoretical properties of Support Vector Machines with respect to other machine learning alternatives due to their max-margin training paradigm have led us to suggest them as a good technique for robust speech recognition. However, important shortcomings have had to be circumvented, the most important being the normalisation of the time duration of different realisations of the acoustic speech units. In this paper, we have compared two approaches in noisy environments: first, a hybrid HMM–SVM solution where a fixed number of frames is selected by means of an HMM segmentation and second, a normalisation kernel called Dynamic Time Alignment Kernel (DTAK) first introduced in Shimodaira et al. [Shimodaira, H., Noma, K., Nakai, M., Sagayama, S., 2001. Support vector machine with dynamic time-alignment kernel for speech recognition. In: Proc. Eurospeech, Aalborg, Denmark, pp. 1841–1844] and based on DTW (Dynamic Time Warping). Special attention has been paid to the adaptation of both alternatives to noisy environments, comparing two types of parameterisations and performing suitable feature normalisation operations. The results show that the DTA Kernel provides important advantages over the baseline HMM system in medium to bad noise conditions, also outperforming the results of the hybrid system.},
    }
  • [DOI] R. Solera-Urena, D. Martin-Iglesias, A. Gallardo-Antolin, C. Peláez-Moreno, and F. Díaz-de-María, “Robust ASR using support vector machines,” Speech Communication, vol. 49, iss. 4, pp. 253-267, 2007.
    [Bibtex]
    @article{RN470,
      author    = {Solera-Ureña, R. and Martín-Iglesias, D. and Gallardo-Antolín, A. and Peláez-Moreno, C. and Díaz-de-María, F.},
      title     = {Robust {ASR} using support vector machines},
      journal   = {Speech Communication},
      volume    = {49},
      number    = {4},
      pages     = {253--267},
      year      = {2007},
      issn      = {0167-6393},
      doi       = {10.1016/j.specom.2007.01.013},
      unique-id = {WOS:000246313700001},
      type      = {Journal Article},
    }

2006

  • [DOI] J. Vicente-Peña, A. Gallardo-Antolín, C. Peláez-Moreno, and F. Díaz-de-María, “Band-pass filtering of the time sequences of spectral parameters for robust wireless speech recognition,” Speech Communication, vol. 48, iss. 10, pp. 1379-1398, 2006.
    [Bibtex]
    @article{VICENTEPENA20061379,
      author   = {J. Vicente-Peña and A. Gallardo-Antolín and C. Peláez-Moreno and F. Díaz-de-María},
      title    = {Band-pass filtering of the time sequences of spectral parameters for robust wireless speech recognition},
      journal  = {Speech Communication},
      volume   = {48},
      number   = {10},
      pages    = {1379--1398},
      year     = {2006},
      issn     = {0167-6393},
      doi      = {10.1016/j.specom.2006.07.007},
      url      = {http://www.sciencedirect.com/science/article/pii/S0167639306000872},
      keywords = {Robust speech recognition, Wireless speech recognition, Transmission errors, Modulation spectrum, RASTA-PLP},
      abstract = {In this paper we address the problem of automatic speech recognition when wireless speech communication systems are involved. In this context, three main sources of distortion should be considered: acoustic environment, speech coding and transmission errors. Whilst the first one has already received a lot of attention, the last two deserve further investigation in our opinion. We have found out that band-pass filtering of the recognition features improves ASR performance when distortions due to these particular communication systems are present. Furthermore, we have evaluated two alternative configurations at different bit error rates (BER) typical of these channels: band-pass filtering the LP-MFCC parameters or a modification of the RASTA-PLP using a sharper low-pass section perform consistently better than LP-MFCC and RASTA-PLP, respectively.},
    }
  • [DOI] C. Peláez-Moreno, A. Gallardo-Antolín, D. F. Gómez-Cajas, and F. Díaz-de-María, “A comparison of front-ends for bitstream-based ASR over IP,” Signal Processing, vol. 86, iss. 7, pp. 1502-1508, 2006.
    [Bibtex]
    @article{PELAEZMORENO20061502,
      author   = {Carmen Peláez-Moreno and Ascensión Gallardo-Antolín and Diego F. Gómez-Cajas and Fernando Díaz-de-María},
      title    = {A comparison of front-ends for bitstream-based {ASR} over {IP}},
      journal  = {Signal Processing},
      volume   = {86},
      number   = {7},
      pages    = {1502--1508},
      year     = {2006},
      issn     = {0165-1684},
      doi      = {10.1016/j.sigpro.2005.08.011},
      url      = {http://www.sciencedirect.com/science/article/pii/S0165168405002860},
      keywords = {Robust speech recognition, Speech coding, IP networks, Coding distortion, Packet loss, LSP},
      abstract = {Automatic speech recognition (ASR) is called to play a relevant role in the provision of spoken interfaces for IP-based applications. However, as a consequence of the transit of the speech signal over these particular networks, ASR systems need to face two new challenges: the impoverishment of the speech quality due to the compression needed to fit the channel capacity and the inevitable occurrence of packet losses. In this framework, bitstream-based approaches that obtain the ASR feature vectors directly from the coded bitstream, avoiding the speech decoding process, have been proposed ([S.H. Choi, H.K. Kim, H.S. Lee, Speech recognition using quantized LSP parameters and their transformations in digital communications, Speech Commun. 30 (4) (2000) 223–233. A. Gallardo-Antolín, C. Pelàez-Moreno, F. Díaz-de-María, Recognizing GSM digital speech, IEEE Trans. Speech Audio Process., to appear. H.K. Kim, R.V. Cox, R.C. Rose, Performance improvement of a bitstream-based front-end for wireless speech recognition in adverse environments, IEEE Trans. Speech Audio Process. 10 (8) (2002) 591–604. C. Peláez-Moreno, A. Gallardo-Antolín, F. Díaz-de-María, Recognizing voice over IP networks: a robust front-end for speech recognition on the WWW, IEEE Trans. Multimedia 3(2) (2001) 209–218], among others) to improve the robustness of ASR systems. LSP (Line Spectral Pairs) are the preferred set of parameters for the description of the speech spectral envelope in most of the modern speech coders. Nevertheless, LSP have proved to be unsuitable for ASR, and they must be transformed into cepstrum-type parameters. In this paper we comparatively evaluate the robustness of the most significant LSP to cepstrum transformations in a simulated VoIP (voice over IP) environment which includes two of the most popular codecs used in that network (G.723.1 and G.729) and several network conditions. In particular, we compare ‘pseudocepstrum’ [H.K. Kim, S.H. Choi, H.S. Lee, On approximating Line Spectral Frequencies to LPC cepstral coefficients, IEEE Trans. Speech Audio Process. 8 (2) (2000) 195–199], an approximated but straightforward transformation of LSP into LP cepstral coefficients, with a more computationally demanding but exact one. Our results show that pseudocepstrum is preferable when network conditions are good or computational resources low, while the exact procedure is recommended when network conditions become more adverse.},
    }
  • [DOI] C. Peláez-Moreno, A. Gallardo-Antolín, D. F. Gómez-Cajas, and F. Díaz-de-María, “A comparison of front-ends for bitstream-based ASR over IP,” Signal Processing, vol. 86, iss. 7, pp. 1502-1508, 2006.
    [Bibtex]
    @article{RN478,
      author    = {Peláez-Moreno, Carmen and Gallardo-Antolín, Ascensión and Gómez-Cajas, Diego F. and Díaz-de-María, Fernando},
      title     = {A comparison of front-ends for bitstream-based {ASR} over {IP}},
      journal   = {Signal Processing},
      volume    = {86},
      number    = {7},
      pages     = {1502--1508},
      year      = {2006},
      issn      = {0165-1684},
      doi       = {10.1016/j.sigpro.2005.08.011},
      unique-id = {WOS:000237769300013},
      type      = {Journal Article},
    }
  • [DOI] S. Salcedo-Sanz, A. Gallardo-Antolin, J. M. Leiva-Murillo, and C. Bousono-Calzon, “Offline speaker segmentation using genetic algorithms and mutual information,” IEEE Transactions on Evolutionary Computation, vol. 10, iss. 2, pp. 175-186, 2006.
    [Bibtex]
    @article{RN479,
      author    = {Salcedo-Sanz, S. and Gallardo-Antolin, A. and Leiva-Murillo, J. M. and Bousono-Calzon, C.},
      title     = {Offline speaker segmentation using genetic algorithms and mutual information},
      journal   = {IEEE Transactions on Evolutionary Computation},
      volume    = {10},
      number    = {2},
      pages     = {175--186},
      year      = {2006},
      issn      = {1089-778X},
      doi       = {10.1109/tevc.2005.857079},
      unique-id = {WOS:000236814000007},
      type      = {Journal Article},
    }
  • [DOI] J. Vicente-Pena, A. Gallardo-Antolin, C. Peláez-Moreno, and F. Díaz-de-María, “Band-pass filtering of the time sequences of spectral parameters for robust wireless speech recognition,” Speech Communication, vol. 48, iss. 10, pp. 1379-1398, 2006.
    [Bibtex]
    @article{RN477,
      author    = {Vicente-Peña, J. and Gallardo-Antolín, A. and Peláez-Moreno, C. and Díaz-de-María, F.},
      title     = {Band-pass filtering of the time sequences of spectral parameters for robust wireless speech recognition},
      journal   = {Speech Communication},
      volume    = {48},
      number    = {10},
      pages     = {1379--1398},
      year      = {2006},
      issn      = {0167-6393},
      doi       = {10.1016/j.specom.2006.07.007},
      unique-id = {WOS:000241586500011},
      type      = {Journal Article},
    }

2005

  • [DOI] A. Gallardo-Antolin, C. Pelaez-Moreno, and F. Diaz-de-Maria, “Recognizing GSM digital speech,” IEEE Transactions on Speech and Audio Processing, vol. 13, iss. 6, pp. 1186-1205, 2005.
    [Bibtex]
    @article{Gallardo-Antolin2005,
      author   = {A. Gallardo-Antolin and C. Pelaez-Moreno and F. Diaz-de-Maria},
      title    = {Recognizing {GSM} digital speech},
      journal  = {IEEE Transactions on Speech and Audio Processing},
      year     = {2005},
      month    = nov,
      volume   = {13},
      number   = {6},
      pages    = {1186--1205},
      keywords = {speech recognition;cellular radio;combined source-channel coding;speech coding;speech codecs;feature extraction;quantisation (signal);decoding;code standards;distortion;radio networks;digital speech recognition;GSM network;global system for mobile;source coding distortion;error transmission;feature extraction;speech encoding;quantization distortion;decoding process;bit allocation;full-rate standard codec;tandeming;wireless network;Speech recognition;GSM;Automatic speech recognition;Source coding;Feature extraction;Working environment noise;Decoding;Quantization;Code standards;Codecs;Coding distortion;Global System for Mobile (GSM) networks;speech coding;speech recognition;tandeming;transmission errors;wireless networks},
      doi      = {10.1109/TSA.2005.853210},
      issn     = {1063-6676},
    }
  • [DOI] A. Gallardo-Antolin, C. Peláez-Moreno, and F. Díaz-de-María, “Recognizing GSM digital speech,” IEEE Transactions on Speech and Audio Processing, vol. 13, iss. 6, pp. 1186-1205, 2005.
    [Bibtex]
    @article{RN483,
      author    = {Gallardo-Antolin, A. and Peláez-Moreno, C. and Díaz-de-María, F.},
      title     = {Recognizing {GSM} digital speech},
      journal   = {IEEE Transactions on Speech and Audio Processing},
      volume    = {13},
      number    = {6},
      pages     = {1186--1205},
      year      = {2005},
      issn      = {1063-6676},
      doi       = {10.1109/tsa.2005.853210},
      unique-id = {WOS:000232734500009},
      type      = {Journal Article},
    }

2003

  • F. J. Valverde-Albacete, R. Pedraza-Jimenez, H. Molina-Bulla, J. Cid-Sueiro, P. Díaz-Perez, and A. Navia-Vazquez, “InterMediActor: an environment for instructional content design based on competences,” Educational Technology & Society, vol. 6, iss. 4, pp. 30-47, 2003.
    [Bibtex]
    @article{RN488,
      author    = {Valverde-Albacete, F. J. and Pedraza-Jimenez, R. and Molina-Bulla, H. and Cid-Sueiro, J. and Díaz-Perez, P. and Navia-Vazquez, A.},
      title     = {{InterMediActor}: an environment for instructional content design based on competences},
      journal   = {Educational Technology \& Society},
      volume    = {6},
      number    = {4},
      pages     = {30--47},
      year      = {2003},
      issn      = {1436-4522},
      unique-id = {WOS:000189152100005},
      type      = {Journal Article},
    }

2001

  • [DOI] C. Pelaez-Moreno, A. Gallardo-Antolin, and F. Diaz-de-Maria, “Recognizing voice over IP: a robust front-end for speech recognition on the world wide web,” IEEE Transactions on Multimedia, vol. 3, iss. 2, pp. 209-218, 2001.
    [Bibtex]
    @article{Pelaez-Moreno2001,
      author   = {C. Pelaez-Moreno and A. Gallardo-Antolin and F. Diaz-de-Maria},
      title    = {Recognizing voice over {IP}: a robust front-end for speech recognition on the world wide web},
      journal  = {IEEE Transactions on Multimedia},
      year     = {2001},
      month    = jun,
      volume   = {3},
      number   = {2},
      pages    = {209--218},
      keywords = {speech recognition;speech coding;Internet;information resources;Internet telephony;error handling;decoding;encoding;protocols;robust front-end;speech recognition;world wide web;Internet protocol environment;lossy speech coding;packet loss;recognition feature vectors;encoded speech;quantization distortion;encoding-decoding process;ITU G.723.1 standard codec;automatic speech recognition;speaker-independent isolated digit recognition;speaker-independent continuous speech recognition;simulated packet loss rates;Speech recognition;Internet telephony;Robustness;Automatic speech recognition;Feature extraction;Codecs;Protocols;Speech coding;IP networks;Decoding},
      doi      = {10.1109/6046.923820},
      issn     = {1520-9210},
    }
  • [DOI] C. Peláez-Moreno, A. Gallardo-Antolin, and F. Díaz-de-María, “Recognizing voice over IP: A robust front-end for speech recognition on the World Wide Web,” IEEE Transactions on Multimedia, vol. 3, iss. 2, pp. 209-218, 2001.
    [Bibtex]
    @article{RN492,
      author    = {Peláez-Moreno, C. and Gallardo-Antolin, A. and Díaz-de-María, F.},
      title     = {Recognizing voice over {IP}: A robust front-end for speech recognition on the {World Wide Web}},
      journal   = {IEEE Transactions on Multimedia},
      volume    = {3},
      number    = {2},
      pages     = {209--218},
      year      = {2001},
      issn      = {1520-9210},
      doi       = {10.1109/6046.923820},
      unique-id = {WOS:000173707800004},
      type      = {Journal Article},
    }

1997

  • F. Díaz-de-María and A. R. Figueiras-Vidal, “Improving CELP coders by backward adaptive non-linear prediction,” International Journal of Adaptive Control and Signal Processing, vol. 11, iss. 7, pp. 585-601, 1997.
    [Bibtex]
    @article{Diaz-de-Maria1997,
      author   = {Díaz-de-María, Fernando and Figueiras-Vidal, Aníbal R.},
      title    = {Improving {CELP} coders by backward adaptive non-linear prediction},
      journal  = {International Journal of Adaptive Control and Signal Processing},
      volume   = {11},
      number   = {7},
      pages    = {585--601},
      year     = {1997},
      keywords = {RBF network, non-linear prediction, speech coding, backward adaptation},
      doi      = {10.1002/(SICI)1099-1115(199711)11:7<585::AID-ACS454>3.0.CO;2-9},
      url      = {https://onlinelibrary.wiley.com/doi/abs/10.1002/%28SICI%291099-1115%28199711%2911%3A7%3C585%3A%3AAID-ACS454%3E3.0.CO%3B2-9},
      eprint   = {https://onlinelibrary.wiley.com/doi/pdf/10.1002/%28SICI%291099-1115%28199711%2911%3A7%3C585%3A%3AAID-ACS454%3E3.0.CO%3B2-9},
      abstract = {Non-linear prediction is a natural way to increase the quality of speech coders. In particular, low-delay CELP-type coders can incorporate this improvement because the predictor adaptation is backward. Consequently, there is the possibility of using neural networks as predictors, since their weights (usually a larger number than required in the linear approach) do not have to be transmitted. We apply a radial basis function (RBF) network for this purpose since it computes a regularized solution to the prediction problem. As a result, the stability of the non-linear autoregressive synthesis system can be guaranteed. Investigations of how to combine non-linear predictors with linear predictors indicate that a cascade of an RBF network and a linear filter is a suitable selection since it provides good results and its application to analysis-by-synthesis coders results in large computational advantages with respect to the parallel configuration. This hybrid predictor has been tested for a low-delay code-excited predictive coder, providing an average improvement of 0·4 dB with respect to a CELP coder. Additionally, subjective listening tests give the proposed coder a slight preference over the CELP coder. These results are encouraging because we consider that the proposed coder can be implemented in real time after some improvements, which are detailed as the subject of further work. © 1997 John Wiley \& Sons. Ltd.},
    }
  • F. Díaz-de-María and A. R. Figueiras-Vidal, “Improving CELP coders by backward adaptive non-linear prediction,” International Journal of Adaptive Control and Signal Processing, vol. 11, iss. 7, pp. 585-601, 1997.
    [Bibtex]
    @article{RN494,
      author    = {Díaz-de-María, F. and Figueiras-Vidal, A. R.},
      title     = {Improving {CELP} coders by backward adaptive non-linear prediction},
      journal   = {International Journal of Adaptive Control and Signal Processing},
      volume    = {11},
      number    = {7},
      pages     = {585--601},
      year      = {1997},
      issn      = {0890-6327},
      doi       = {10.1002/(sici)1099-1115(199711)11:7<585::aid-acs454>3.0.co;2-9},
      unique-id = {WOS:A1997YD76000003},
      type      = {Journal Article},
    }

Comments are closed.