Florian Müller

Former Research Associate

Publications

2013

  • Müller, F. and Mertins, A.: Feature Extraction with a Multiscale Modulation Analysis for Robust Automatic Speech Recognition in Proc. Int. Conf. Audio, Speech, and Signal Processing, Vancouver, Canada, May, 2013
    BibTeX
    @INPROCEEDINGS{Muller-ICASSP-2013,
      author = {Florian M{\"u}ller and Alfred Mertins},
      title = {Feature Extraction with a Multiscale Modulation Analysis for Robust
            Automatic Speech Recognition},
      booktitle = {Proc. Int. Conf. Audio, Speech, and Signal Processing},
      year = {2013},
      address = {Vancouver, Canada},
      month = may
    }

2012

  • Müller, F. and Mertins, A.: On Using the Auditory Image Model and Invariant-Integration for Noise Robust Automatic Speech Recognition in Proc. Int. Conf. Audio, Speech, and Signal Processing, pp. 4905-4908, Kyoto, Japan, Mar., 2012
    BibTeX
    @INPROCEEDINGS{Muller2012,
      author = {Florian M{\"u}ller and Alfred Mertins},
      title = {On Using the Auditory Image Model and Invariant-Integration for Noise
            Robust Automatic Speech Recognition},
      booktitle = {Proc. Int. Conf. Audio, Speech, and Signal Processing},
      year = {2012},
      address = {Kyoto, Japan},
      pages = {4905--4908},
      month = mar
    }
  • Müller, F. and Mertins, A.: On the Use of a Wave-Reflection Model for the Estimation of Spectral Effects due to Vocal Tract Length Changes with Application to Automatic Speech Recognition in Proc. 38th German Annual Conference on Acoustics (DAGA 2012), Darmstadt, Germany, Mar., 2012
    BibTeX
    @INPROCEEDINGS{Muller2012a,
      author = {Florian M{\"u}ller and Alfred Mertins},
      title = {On the Use of a Wave-Reflection Model for the Estimation of Spectral
            Effects due to Vocal Tract Length Changes with Application to Automatic
            Speech Recognition},
      booktitle = {Proc. 38th German Annual Conference on Acoustics (DAGA 2012)},
      year = {2012},
      address = {Darmstadt, Germany},
      month = mar
    }
  • Müller, F. and Mertins, A.: Enhancing Vocal Tract Length Normalization with Elastic Registration for Automatic Speech Recognition in Proc. Interspeech-2012, Portland, USA, Sept., 2012
    BibTeX Datei
    @INPROCEEDINGS{Muller2012b,
      author = {Florian M{\"u}ller and Alfred Mertins},
      title = {Enhancing Vocal Tract Length Normalization with Elastic Registration
            for Automatic Speech Recognition},
      booktitle = {Proc. Interspeech-2012},
      year = {2012},
      address = {Portland, USA},
      month = sep
    }
  • Müller, F. and Mertins, A.: Dereverberation with an Iterative Least-Squares Technique and Minimum Mean-Square Error Estimation for Automatic Speech Recognition in Proc. ITG Fachtagung Sprachkommunikation, Braunschweig, Germany, Sept., 2012
    BibTeX Datei
    @INPROCEEDINGS{Muller2012c,
      author = {Florian M{\"u}ller and Alfred Mertins},
      title = {Dereverberation with an Iterative Least-Squares Technique and Minimum
            Mean-Square Error Estimation for Automatic Speech Recognition},
      booktitle = {Proc. ITG Fachtagung Sprachkommunikation},
      year = {2012},
      address = {Braunschweig, Germany},
      month = sep
    }

2011

  • Müller, F. and Mertins, A.: Robust Continuous Speech Recognition through Combination of Invariant-Feature Based Systems in Proc. German Conf. Speech Signal Processing (ESSV 2011), pp. 229-236, Aachen, Germany, Sept., 2011
    BibTeX Datei
    @INPROCEEDINGS{Muller2011a,
      author = {Florian M{\"u}ller and Alfred Mertins},
      title = {Robust Continuous Speech Recognition through Combination of Invariant-Feature
            Based Systems},
      booktitle = {Proc. German Conf. Speech Signal Processing (ESSV 2011)},
      year = {2011},
      pages = {229--236},
      address = {Aachen, Germany},
      month = sep
    }
  • Müller, F. and Mertins, A.: Noise Robust Speaker-Independent Speech Recognition with Invariant-Integration Features Using Power-Bias Subtraction in Proc. Interspeech-2011, pp. 1677-1680, Florence, Italy, Aug., 2011
    BibTeX
    @INPROCEEDINGS{Muller2011b,
      author = {Florian M{\"u}ller and Alfred Mertins},
      title = {Noise Robust Speaker-Independent Speech Recognition with Invariant-Integration
            Features Using Power-Bias Subtraction},
      booktitle = {Proc. Interspeech-2011},
      year = {2011},
      pages = {1677--1680},
      address = {Florence, Italy},
      month = aug
    }
  • Müller, F. and Mertins, A.: Contextual invariant-integration features for improved speaker-independent speech recognition Speech Communication, vol. 53, no. 6, pp. 830 - 841, 2011
    BibTeX Link Link
    @ARTICLE{Muller2011,
      author = {Florian M{\"u}ller and Alfred Mertins},
      title = {Contextual invariant-integration features for improved speaker-independent
            speech recognition},
      journal = {Speech Communication},
      year = {2011},
      volume = {53},
      pages = {830--841},
      number = {6},
      abstract = {This work presents a feature-extraction method that is based on the
            theory of invariant integration. The invariant-integration features
            are derived from an extended time period, and their computation has
            a very low complexity. Recognition experiments show a superior performance
            of the presented feature type compared to cepstral coefficients using
            a mel filterbank (MFCCs) or a gammatone filterbank (GTCCs) in matching
            as well as in mismatching training-testing conditions. Even without
            any speaker adaptation, the presented features yield accuracies that
            are larger than for MFCCs combined with vocal tract length normalization
            (VTLN) in matching training-test conditions. Also, it is shown that
            the invariant-integration features (IIFs) can be successfully combined
            with additional speaker-adaptation methods to further increase the
            accuracy. In addition to standard MFCCs also contextual MFCCs are
            introduced. Their performance lies between the one of MFCCs and IIFs.},
      doi = {10.1016/j.specom.2011.02.002},
      issn = {0167-6393},
      keywords = {Speech recognition}
    }

2010

  • Müller, F. and Mertins, A.: Robust Features for Speaker-Independent Speech Recognition Based on a Certain Class of Translation-Invariant Transformations in Advances in Nonlinear Speech Processing, vol. 5933, pp. 111-119, Springer, LNAI, Heidelberg, Germany, Feb., 2010
    BibTeX
    @INPROCEEDINGS{Muller2010,
      author = {Florian M{\"u}ller and Alfred Mertins},
      title = {Robust Features for Speaker-Independent Speech Recognition Based
            on a Certain Class of Translation-Invariant Transformations},
      booktitle = {Advances in Nonlinear Speech Processing},
      year = {2010},
      editor = {Jordi Sole-Casals and Vladimir Zaiats},
      volume = {5933},
      series = {LNAI},
      pages = {111--119},
      address = {Heidelberg, Germany},
      month = feb,
      publisher = {Springer},
      isbn = {978-3-642-11508-0}
    }
    
    
  • Müller, F. and Mertins, A.: Invariant Integration Features Combined with Speaker-Adaptation Methods in Proc. Int. Conf. Spoken Language Processing (Interspeech 2010-ICSLP), pp. 2622-2625, Makuhari, Japan, Sept., 2010
    BibTeX
    @INPROCEEDINGS{Muller2010a,
      author = {Florian M{\"u}ller and Alfred Mertins},
      title = {Invariant Integration Features Combined with Speaker-Adaptation Methods},
      booktitle = {Proc. Int. Conf. Spoken Language Processing (Interspeech 2010-ICSLP)},
      year = {2010},
      address = {Makuhari, Japan},
      month = sep,
      pages = {2622--2625},
      abstract = {Speaker-normalization and -adaptation methods are essential components
            of state-of-the-art speech recognition systems nowadays. Recently,
            so-called invariant integration features were presented which are
            motivated by the theory of invariants. While it was shown that the
            integration features outperform MFCCs when used with a basic monophone
            recognition system, it was left open, if their benefits still can
            be observed when a more sophisticated recognition system with speaker-normalization
            and/or speaker-adaptation components is used. This work investigates
            the combination of the integration features with standard speaker-normalization
            and -adaptation methods. We show that the integration features benefit
            from adaptation methods and significantly outperform MFCCs in matching,
            as well as in mismatching training-test conditions.},
      keywords = {Speaker independency, invariant integration, speaker normalization, speaker adaptation}
    }
    
  • Condurache, A. P., Müller, F. and Mertins, A.: An LDA-based relative hysteresis classifier with application to segmentation of retinal vessels in Proc. Int. Conf. Pattern Recognition (ICPR), pp. 4202-4205, Istanbul, Turkey, Sept., 2010
    BibTeX
    @INPROCEEDINGS{Condurache2010,
      author = {A. P. Condurache and F. M{\"u}ller and A. Mertins},
      title = {An LDA-based relative hysteresis classifier with application to segmentation
            of retinal vessels},
      booktitle = {Proc. Int. Conf. Pattern Recognition (ICPR)},
      year = {2010},
      address = {Istanbul, Turkey},
      month = sep,
      pages = {4202--4205},
      abstract = {In a pattern classification setup, image segmentation is achieved
            by assigning each pixel to one of two classes: object or background.
            The special case of vessel segmentation is characterized by a strong
            disproportion between the number of representatives of each class
            (i.e. class skew) and also by a strong overlap between classes. These
            difficulties can be solved using problem-specific knowledge. The
            proposed hysteresis classification makes use of such knowledge in
            an efficient way. We describe a novel, supervised, hysteresis-based
            classification method that we apply to the segmentation of retina
            photographies. This procedure is fast and achieves results that comparable
            or even superior to other hysteresis methods and, for the problem
            of retina vessel segmentation, to known dedicated methods on similar
            data sets.}
    }

2009

  • Müller, F. and Mertins, A.: Nonlinear translation-invariant transformations for speaker-independent speech recognition in ISCA Tutorial and Research Workshop on Non-Linear Speech Processing (NOLISP'09), Vic, Spain, Jun., 2009
    BibTeX
    @INPROCEEDINGS{Muller2009,
      author = {Florian M{\"u}ller and Alfred Mertins},
      title = {Nonlinear translation-invariant transformations for speaker-independent
            speech recognition},
      booktitle = {ISCA Tutorial and Research Workshop on Non-Linear Speech Processing (NOLISP'09)},
      year = {2009},
      address = {Vic, Spain},
      month = jun
    }
    
  • Müller, F. and Mertins, A.: Invariant-integration method for robust feature extraction in speaker-independent speech recognition in Proc. Interspeech 2009, Brighton, Sept., 2009
    BibTeX
    @INPROCEEDINGS{Muller2009a,
      author = {Florian M{\"u}ller and Alfred Mertins},
      title = {Invariant-integration method for robust feature extraction in speaker-independent
            speech recognition},
      booktitle = {Proc. Interspeech 2009},
      year = {2009},
      address = {Brighton},
      month = sep
    }
  • Müller, F., Belilovsky, E. and Mertins, A.: Generalized Cyclic Transformations in Speaker-Independent Speech Recognition in Proc. 2009 IEEE Automatic Speech Recognition and Understanding Workshop, Merano, Italy, Dec. 13-17, 2009
    BibTeX
    @INPROCEEDINGS{Muller2009b,
      author = {Florian M{\"u}ller and Eugene Belilovsky and Alfred Mertins},
      title = {Generalized Cyclic Transformations in Speaker-Independent Speech
            Recognition},
      booktitle = {Proc. 2009 IEEE Automatic Speech Recognition and Understanding Workshop},
      year = {2009},
      address = {Merano, Italy},
      month = dec # " 13--17"
    }
    

2008

  • Kabus, S., Müller, F., Wiemker, R. and Fischer, B.: Robust lung nodule growth measurement by combining registration and segmentation in Proceedings of the First International Workshop on Pulmonary Image Analysis, pp. 15-23, New York, USA, Sept., 2008
    BibTeX
    @INPROCEEDINGS{Kabus2008,
      author = {Sven Kabus and Florian M{\"u}ller and Rafael Wiemker and Bernd Fischer},
      title = {Robust lung nodule growth measurement by combining registration and
            segmentation},
      booktitle = {Proceedings of the First International Workshop on Pulmonary Image
            Analysis},
      year = {2008},
      pages = {15--23},
      address = {New York, USA},
      month = sep
    }
    

2005

  • Wesker, T., Meyer, B., Wagener, K., Anemüller, J., Mertins, A. and Kollmeier, B.: Oldenburg Logatome Speech Corpus (OLLO) for Speech Recognition Experiments with Humans and Machines in Proc. Interspeech 2005, pp. 1273-1276, Lisbon, Portugal, Sept., 2005
    BibTeX
    @INPROCEEDINGS{OLLO-05,
      author = {Thorsten Wesker and Bernd Meyer and Kirsten Wagener and J{\"o}rn Anem{\"u}ller
            and Alfred Mertins and Birger Kollmeier},
      title = {Oldenburg Logatome Speech Corpus {(OLLO)} for Speech Recognition
            Experiments with Humans and Machines},
      booktitle = {Proc. Interspeech 2005},
      year = {2005},
      pages = {1273--1276},
      address = {Lisbon, Portugal},
      month = sep
    }

1999

  • Dippel, S., Stahl, M., Aach, T., Buzug, T. M., Wiemker, R., Neitzel, U., Müller, E. and Haas, J. P.: Rauschrobuste Verbesserung schwacher Strukturen in digitalen Radiographien durch nichtlineare Multiskalen-Filterung in Bildverarbeitung für die Medizin 1999, pp. 21-25, Springer-Verlag, 1999
    BibTeX
    @INPROCEEDINGS{DIP99a,
      author = {S. Dippel and M. Stahl and T. Aach and T. M. Buzug and R. Wiemker
            and U. Neitzel and E. M{\"u}ller and J. P. Haas},
      title = {Rauschrobuste Verbesserung schwacher Strukturen in digitalen Radiographien
            durch nichtlineare Multiskalen-Filterung},
      booktitle = {Bildverarbeitung f{\"u}r die Medizin 1999},
      year = {1999},
      editor = {Evers and Glombitza and Lehmann and Meinzer},
      pages = {21--25},
      publisher = {Springer-Verlag}
    }
    
  • Müller, E., Aach, T., Buzug, T. M., Dippel, S., Stahl, M., Wiemker, R. and Haas, J. P.: First Clinical Experiences with Noise-Resistant Non-Linear Multiscale Processing in European Congress on Radiology, Wien, Mar., 1999
    BibTeX
    @INPROCEEDINGS{MUE99a,
      author = {E. M{\"u}ller and T. Aach and T. M. Buzug and S. Dippel and M. Stahl
            and R. Wiemker and J. P. Haas},
      title = {First Clinical Experiences with Noise-Resistant Non-Linear Multiscale
            Processing},
      booktitle = {European Congress on Radiology},
      year = {1999},
      address = {Wien},
      month = mar
    }