Preprints

  1. X. Alameda-Pineda, V. Drouard, and R. Horaud, Variational Inference and Learning of Piecewise-linear Dynamical Systems, 2020. [ bib pdf arxiv ]
    @unpublished{Alameda-TNNLS-2020,
      author = {Xavier Alameda-Pineda  and Vincent Drouard and Radu Horaud},
      title  = {Variational Inference and Learning of Piecewise-linear Dynamical Systems},
      note   = {Submitted to IEEE Transactions on Neural Networks and Learning Systems},
      year   = {2020},
      arxiv  = {https://arxiv.org/abs/2006.01668},
      pdf    = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-TNNLS-2020.pdf},
    }
  2. G. Delorme, Y. Ban, G. Sarrazin, and X. Alameda-Pineda, ODA-Track: Online Deep Appearance for Robotic Multiple Person Tracking, 2020. [ bib ]
    @unpublished{Delorme-ICRA-2020,
      author = {Guillaume Delorme and Yutong Ban and Guillaume Sarrazin and Xavier Alameda-Pineda},
      title  = {ODA-Track: Online Deep Appearance for Robotic Multiple Person Tracking},
      note   = {Preprint},
      year   = {2020},
    }
  3. L. Girin, S. Leglaive, X. Bie, J. Diard, T. Hueber, and X. Alameda-Pineda, Dynamical Variational Autoencoders: A Comprehensive Review, 2020. [ bib pdf ]
    @unpublished{Girin-DVAE-2020,
      author        = {Girin, Laurent and Leglaive, Simon and Bie, Xiaoyu and Diard, Julien and Hueber, Thomas and Alameda-Pineda, Xavier},
      title         = {Dynamical Variational Autoencoders: A Comprehensive Review},
      note          = {arXiv preprint arXiv:2008.12595},
      year          = {2020},
      eprint        = {2008.12595},
      archiveprefix = {arXiv},
      arxiv         = {https://arxiv.org/abs/2008.12595},
      pdf           = {http://xavirema.eu/wp-content/papercite-data/pdf/Girin-DVAE-2020.pdf},
    }
  4. Y. Liu, M. D. Nadai, J. Yao, N. Sebe, B. Lepri, and X. Alameda-Pineda, GMM-UNIT: Unsupervised Multi-Domain and Multi-Modal Image-to-Image Translation via Attribute Gaussian Mixture Modeling, 2020. [ bib arxiv ]
    @unpublished{Liu-2020,
      author        = {Yahui Liu and Marco De Nadai and Jian Yao and Nicu Sebe and Bruno Lepri and Xavier Alameda-Pineda},
      title         = {GMM-UNIT: Unsupervised Multi-Domain and Multi-Modal Image-to-Image Translation via Attribute Gaussian Mixture Modeling},
      note          = {arXiv preprint arXiv:2003.06788},
      year          = {2020},
      eprint        = {2003.06788},
      archiveprefix = {arXiv},
      arxiv         = {https://arxiv.org/abs/2003.06788},
    }
  5. V. Nguyen, M. Sadeghi, E. Ricci, and X. Alameda-Pineda, Deep Variational Generative Models for Audio-visual Speech Separation, 2020. [ bib pdf ]
    @unpublished{Nguyen-2020,
      author        = {Nguyen, Viet-Nhat and Sadeghi, Mostafa and Ricci, Elisa and Alameda-Pineda, Xavier},
      title         = {Deep Variational Generative Models for Audio-visual Speech Separation},
      note          = {arXiv preprint arXiv:2008.07191},
      year          = {2020},
      eprint        = {2008.07191},
      archiveprefix = {arXiv},
      arxiv         = {https://arxiv.org/abs/2008.07191},
      pdf           = {http://xavirema.eu/wp-content/papercite-data/pdf/Nguyen-2020.pdf},
    }
  6. M. Sadeghi and X. Alameda-Pineda, Mixture of Inference Networks for VAE-based Audio-visual Speech Enhancement, 2020. [ bib arxiv ]
    @unpublished{Sadeghi-2020-TSP,
      author = {Mostafa Sadeghi and Xavier Alameda-Pineda},
      title  = {Mixture of Inference Networks for VAE-based Audio-visual Speech Enhancement},
      note   = {Submitted to IEEE TSP},
      year   = {2020},
      arxiv  = {https://arxiv.org/abs/1912.10647},
    }

Books

  1. X. Alameda-Pineda, E. Ricci, and N. Sebe, Multimodal Behavior Analysis in the Wild: Advances and Challenges, Elsevier, 2018. [ bib ]
    @book{Alameda-Ricci-Sebe,
      title = {Multimodal Behavior Analysis in the Wild: Advances and Challenges},
      author = {Xavier Alameda-Pineda and Elisa Ricci and Nicu Sebe},
      year = {2018},
      publisher = {Elsevier},
    }

Patents

  1. N. Sebe, X. Alameda-Pineda, S. Tulyakov, E. Ricci, L. Yin, and J. F. Cohn, “Self-adaptive matrix completion for heart rate estimation from face videos under realistic conditions,” Patent Application US 15631346, 2017. [ bib ]
    @patent{Sebe-Patent-2017,
      author={Nicu Sebe and Xavier Alameda-Pineda and Sergey Tulyakov and Elisa Ricci and Lijun Yin and Jeffrey F. Cohn},
      title={Self-adaptive matrix completion for heart rate estimation from face videos under realistic conditions},
      type={Patent Application},
      number={US 15631346},
      year={2017},
    }

Book Chapters

  1. X. Alameda-Pineda, E. Ricci, and N. Sebe, “Multimodal analysis of free-standing conversational groups,” in Frontiers of Multimedia Research, S. Chang, Ed., Morgan and Claypool, 2017, pp. 51-74. [ bib ]
    @incollection{Alameda-BookMM-2017,
      author    = {Xavier Alameda-Pineda and Elisa Ricci and Nicu Sebe},
      title     = {Multimodal analysis of free-standing conversational groups},
      editor    = {Shih-Fu Chang},
      booktitle = {Frontiers of Multimedia Research},
      publisher = {Morgan and Claypool},
      year      = {2017},
      pages     = {51--74},
    }
  2. X. Alameda-Pineda, E. Ricci, and N. Sebe, “Multimodal behavior analysis in the wild: an introduction,” in Multimodal behavior analysis in the wild, X. Alameda-Pineda, E. Ricci, and N. Sebe, Eds., Elsevier, 2018, pp. 1-10. [ bib ]
    @incollection{alameda2018multimodal-intro,
      author    = {Xavier Alameda-Pineda and Elisa Ricci and Nicu Sebe},
      title     = {Multimodal behavior analysis in the wild: an introduction},
      editor    = {Xavier Alameda-Pineda and Elisa Ricci and Nicu Sebe},
      booktitle = {Multimodal behavior analysis in the wild},
      publisher = {Elsevier},
      year      = {2018},
      chapter   = {1},
      pages     = {1--10},
    }
  3. X. Alameda-Pineda, R. Subramanian, E. Ricci, O. Lanz, and N. Sebe, “SALSA: A multimodal dataset for the automated analysis of free-standing social interactions,” in Group and Crowd Behavior for Computer Vision, V. Murino, M. Cristani, S. Shah, and S. Savarese, Eds., Elsevier, 2016. [ bib ]
    @incollection{Alameda-BookCBA-2016,
      title = {SALSA: A multimodal dataset for the automated analysis of free-standing social interactions},
      author = {Xavier Alameda-Pineda and Ramanathan Subramanian and Elisa Ricci and Oswald Lanz and Nicu Sebe},
      booktitle = {Group and Crowd Behavior for Computer Vision},
      editor = {Vittorio Murino and Marco Cristani and Shishir Shah and Silvio Savarese},
      publisher = {Elsevier},
      year = {2016},
    }

Journal Articles

2020

  1. Y. Ban, X. Alameda-Pineda, L. Girin, and R. Horaud, “Variational Bayesian Inference for Audio-Visual Tracking of Multiple Speakers,” IEEE Transactions on Pattern Analysis and Machine Intelligence, 2020. [ bib pdf arxiv ]
    @article{Ban-TPAMI-2020,
      author  = {Yutong Ban and Xavier Alameda-Pineda and Laurent Girin and Radu Horaud},
      title   = {Variational Bayesian Inference for Audio-Visual Tracking of Multiple Speakers},
      journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
      year    = {2020},
      doi     = {10.1109/TPAMI.2019.2953020},
      arxiv   = {https://arxiv.org/abs/1809.10961},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Ban-TPAMI-2020.pdf},
    }
  2. M. Sadeghi, S. Leglaive, X. Alameda-Pineda, L. Girin, and R. Horaud, “Audio-visual Speech Enhancement Using Conditional Variational Auto-Encoders,” IEEE/ACM Transactions on Audio, Speech, and Language Processing, 2020. [ bib pdf arxiv ]
    @article{Sadeghi-TASLP-2020,
      author  = {Mostafa Sadeghi and Simon Leglaive and Xavier Alameda-Pineda and Laurent Girin and Radu Horaud},
      title   = {Audio-visual Speech Enhancement Using Conditional Variational Auto-Encoders},
      journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
      year    = {2020},
      doi     = {10.1109/TASLP.2020.3000593},
      arxiv   = {https://arxiv.org/abs/1908.02590},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Sadeghi-TASLP-2020.pdf},
    }
  3. W. Wang, X. Alameda-Pineda, D. Xu, E. Ricci, and N. Sebe, “Learning How to Smile: Expression Video Generation with Conditional Adversarial Recurrent Nets,” IEEE Transactions on Multimedia, 2020. [ bib pdf ]
    @article{Wang-TMM-2020.bib,
      author  = {Wei Wang and Xavier Alameda-Pineda and Dan Xu and Elisa Ricci and Nicu Sebe},
      title   = {Learning How to Smile: Expression Video Generation with Conditional Adversarial Recurrent Nets},
      journal = {IEEE Transactions on Multimedia},
      year    = {2020},
      doi     = {10.1109/TMM.2019.2963621},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Wang-TMM-2020.pdf},
    }

2019

  1. Y. Ban, X. Alameda-Pineda, C. Evers, and R. Horaud, “Tracking Multiple Audio Sources with the Von Mises Distribution and Variational EM,” IEEE Signal Processing Letters, vol. 26, iss. 6, pp. 798-802, 2019. [ bib pdf ]
    @article{Ban-SPL-2019,
      author  = {Y. Ban and X. Alameda-Pineda and C. Evers and R. Horaud},
      title   = {Tracking Multiple Audio Sources with the Von Mises Distribution and Variational EM},
      journal = {IEEE Signal Processing Letters},
      volume  = {26},
      number  = {6},
      pages   = {798--802},
      year    = {2019},
      doi     = {10.1109/LSP.2019.2908376},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Ban-SPL-2019.pdf},
    }
  2. S. Lathuilière, P. Mesejo, X. Alameda-Pineda, and R. Horaud, “A Comprehensive Analysis of Deep Regression,” IEEE Transactions on Pattern Analysis and Machine Intelligence, 2019. [ bib pdf arxiv ]
    @article{Lathuiliere-TPAMI-2019,
      author  = {St{\'e}phane Lathuili{\`e}re and Pablo Mesejo and Xavier Alameda-Pineda and Radu Horaud},
      title   = {A Comprehensive Analysis of Deep Regression},
      journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
      year    = {2019},
      doi     = {10.1109/TPAMI.2019.2910523},
      arxiv   = {https://arxiv.org/abs/1803.08450},
      soft    = {https://github.com/Stephlat/DeepRegression},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Lathuiliere-TPAMI-2019.pdf},
    }
  3. X. Li, Y. Ban, L. Girin, X. Alameda-Pineda, and R. Horaud, “Online Localization and Tracking of Multiple Moving Speakers in Reverberant Environment,” IEEE Journal of Selected Topics in Signal Processing, vol. 13, iss. 1, pp. 88-103, 2019. [ bib pdf arxiv ]
    @article{Li-JSTSP-2019,
      author  = {Xiaofei Li and Yutong Ban and Laurent Girin and Xavier Alameda-Pineda and Radu Horaud},
      title   = {Online Localization and Tracking of Multiple Moving Speakers in Reverberant Environment},
      journal = {IEEE Journal of Selected Topics in Signal Processing},
      volume  = {13},
      number  = {1},
      pages   = {88--103},
      year    = {2019},
      doi     = {10.1109/JSTSP.2019.2903472},
      arxiv   = {https://arxiv.org/abs/1809.10936},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Li-JSTSP-2019.pdf},
    }
  4. A. Siarohin, G. Zen, C. Majtanovic, X. Alameda-Pineda, E. Ricci, and N. Sebe, “Increasing Image Memorability with Neural Style Transfer,” ACM Transactions on Multimedia Computing Communications and Applications, 2019. [ bib pdf ]
    @article{Siarohin-TOMM-2019,
      author  = {A. Siarohin and G. Zen and C. Majtanovic and X. Alameda-Pineda and E. Ricci and N. Sebe},
      title   = {Increasing Image Memorability with Neural Style Transfer},
      journal = {ACM Transactions on Multimedia Computing Communications and Applications},
      year    = {2019},
      doi     = {10.1145/3311781},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Siarohin-TOMM-2019.pdf},
    }

2018

  1. D. Xu, X. Alameda-Pineda, J. Song, E. Ricci, and N. Sebe, “Cross-Paced Representation Learning with Partial Curricula for Sketch-based Image Retrieval,” IEEE Transactions on Image Processing, 2018. [ bib pdf arxiv ]
    @article{Xu-TIP-2018,
      author  = {Dan Xu and Xavier Alameda-Pineda and Jingkuan Song and Elisa Ricci and Nicu Sebe},
      title   = {Cross-Paced Representation Learning with Partial Curricula for Sketch-based Image Retrieval},
      journal = {IEEE Transactions on Image Processing},
      year    = {2018},
      doi     = {10.1109/TIP.2018.2837381},
      arxiv   = {https://arxiv.org/abs/1803.01504},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Xu-TIP-2018.pdf},
    }

2017

  1. D. Fabre, T. Hueber, L. Girin, X. Alameda-Pineda, and P. Badin, “Automatic Animation of an Articulatory Tongue Model from Ultrasound Images of the Vocal Tract,” Speech Communication, vol. 93, pp. 63-75, 2017. [ bib pdf ]
    @article{Fabre-SpeechCom-2017,
      author  = {Diandra Fabre and Thomas Hueber and Laurent Girin and Xavier Alameda-Pineda and Pierre Badin},
      title   = {Automatic Animation of an Articulatory Tongue Model from Ultrasound Images of the Vocal Tract},
      journal = {Speech Communication},
      volume  = {93},
      pages   = {63--75},
      year    = {2017},
      doi     = {10.1016/j.specom.2017.08.002},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Fabre-SpeechCom-2017.pdf},
    }
  2. L. Girin, T. Hueber, and X. Alameda-Pineda, “Extending the Cascaded Gaussian Mixture Regression Framework for Cross-Speaker Acoustic-Articulatory Mapping,” IEEE/ACM Transactions on Audio, Speech, and Language Processing, 2017. [ bib pdf ]
    @article{Girin-TASLP-2017,
      author  = {L. Girin and T. Hueber and X. Alameda-Pineda},
      title   = {Extending the Cascaded Gaussian Mixture Regression Framework for Cross-Speaker Acoustic-Articulatory Mapping},
      journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
      year    = {2017},
      doi     = {10.1109/TASLP.2017.2651398},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Girin-TASLP-2017.pdf},
    }

2016

  1. X. Alameda-Pineda, J. Staiano, R. Subramanian, L. M. Batrinca, E. Ricci, B. Lepri, O. Lanz, and N. Sebe, “SALSA: A Novel Dataset for Multimodal Group Behavior Analysis,” IEEE Transactions on Pattern Analysis and Machine Intelligence, vol. 38, iss. 8, pp. 1707-1720, 2016. [ bib pdf data arxiv ]
    @article{Alameda-TPAMI-2016,
      author  = {Xavier Alameda-Pineda and Jacopo Staiano and Ramanathan Subramanian and Ligia Maria Batrinca and Elisa Ricci and Bruno Lepri and Oswald Lanz and Nicu Sebe},
      title   = {{SALSA:} {A} Novel Dataset for Multimodal Group Behavior Analysis},
      journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
      volume  = {38},
      number  = {8},
      pages   = {1707--1720},
      year    = {2016},
      doi     = {10.1109/TPAMI.2015.2496269},
      arxiv   = {http://arxiv.org/abs/1506.06882},
      data    = {http://tev.fbk.eu/salsa},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-TPAMI-2016.pdf},
    }
  2. S. Ba, X. Alameda-Pineda, A. Xompero, and R. Horaud, “An On-line Variational Bayesian Model for Multi-Person Tracking from Cluttered Scenes,” Computer Vision and Image Understanding, vol. 153, pp. 64-76, 2016. [ bib pdf arxiv ]
    @article{Ba-CVIU-2016,
      author  = {Sileye Ba and Xavier Alameda-Pineda and Alessio Xompero and Radu Horaud},
      title   = {An On-line Variational Bayesian Model for Multi-Person Tracking from Cluttered Scenes},
      journal = {Computer Vision and Image Understanding},
      volume  = {153},
      pages   = {64--76},
      year    = {2016},
      doi     = {10.1016/j.cviu.2016.07.006},
      url     = {http://arxiv.org/abs/1509.01520},
      arxiv   = {http://arxiv.org/abs/1509.01520},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Ba-CVIU-2016.pdf},
    }
  3. I. Gebru, X. Alameda-Pineda, F. Forbes, and R. Horaud, “EM algorithms for weighted-data clustering with application to audio-visual scene analysis,” IEEE Transactions on Pattern Analysis and Machine Intelligence, vol. 38, iss. 12, pp. 2402-2415, 2016. [ bib pdf code data arxiv ]
    @article{Gebru-TPAMI-2016,
      author  = {Israel-Dejene Gebru and Xavier Alameda-Pineda and Florence Forbes and Radu Horaud},
      title   = {{EM} algorithms for weighted-data clustering with application to audio-visual scene analysis},
      journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
      volume  = {38},
      number  = {12},
      pages   = {2402--2415},
      year    = {2016},
      doi     = {10.1109/TPAMI.2016.2522425},
      url     = {http://arxiv.org/abs/1509.01509},
      arxiv   = {http://arxiv.org/abs/1509.01509},
      soft    = {http://perception.inrialpes.fr/people/Gebru/code/WD-EM.zip},
      data    = {https://team.inria.fr/perception/avtrack1/},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Gebru-TPAMI-2016.pdf},
    }
  4. D. Kounades-Bastian, L. Girin, X. Alameda-Pineda, S. Gannot, and R. Horaud, “A Variational EM Algorithm for the Separation of Time-Varying Convolutive Audio Mixtures,” IEEE/ACM Transactions on Audio, Speech and Language Processing, vol. 24, iss. 8, pp. 1408-1423, 2016. [ bib pdf arxiv ]
    @article{Kounades-TASLP-2016,
      author  = {Dionyssos Kounades-Bastian and Laurent Girin and Xavier Alameda-Pineda and Sharon Gannot and Radu Horaud},
      title   = {A Variational {EM} Algorithm for the Separation of Time-Varying Convolutive Audio Mixtures},
      journal = {IEEE/ACM Transactions on Audio, Speech and Language Processing},
      volume  = {24},
      number  = {8},
      pages   = {1408--1423},
      year    = {2016},
      doi     = {10.1109/TASLP.2016.2554286},
      url     = {http://arxiv.org/abs/1510.04595},
      arxiv   = {http://arxiv.org/abs/1510.04595},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Kounades-TASLP-2016.pdf},
    }

2015

  1. X. Alameda-Pineda and R. Horaud, “Vision-Guided Robot Hearing,” International Journal of Robotics Research, vol. 34, iss. 4-5, pp. 437-456, 2015. [ bib pdf code arxiv ]
    @article{Alameda-IJRR-2014,
      title={Vision-Guided Robot Hearing},
      author={Xavier Alameda-Pineda and Radu Horaud},
      journal={{International Journal of Robotics Research}},
      year={2015},
      volume={34},
      number={4-5},
      pages={437--456},
      doi={10.1177/0278364914548050},
      arxiv={http://arxiv.org/abs/1311.2460},
      soft={https://code.humavips.eu},
      pdf={http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-IJRR-2014.pdf},
    }
  2. T. Hueber, L. Girin, X. Alameda-Pineda, and G. Bailly, “Speaker-Adaptive Acoustic-Articulatory Inversion using Cascaded Gaussian Mixture Regression,” IEEE/ACM Transactions on Audio, Speech and Language Processing, vol. 23, iss. 12, pp. 2246-2259, 2015. [ bib pdf ]
    @article{Hueber-TASLP-2015,
      author  = {Hueber, Thomas and Girin, Laurent and Alameda-Pineda, Xavier and Bailly, Gerard},
      title   = {Speaker-Adaptive Acoustic-Articulatory Inversion using Cascaded Gaussian Mixture Regression},
      journal = {IEEE/ACM Transactions on Audio, Speech and Language Processing},
      volume  = {23},
      number  = {12},
      pages   = {2246--2259},
      year    = {2015},
      doi     = {10.1109/TASLP.2015.2464702},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Hueber-TASLP-2015.pdf},
    }

2014

  1. X. Alameda-Pineda and R. Horaud, “A Geometric Approach to Sound Source Localization from Time-Delay Estimates,” IEEE Transactions on Audio, Speech and Language Processing, vol. 22, iss. 6, pp. 1082-1095, 2014. [ bib pdf code arxiv ]
    @article{Alameda-TASLP-2014,
      author  = {Xavier Alameda-Pineda and Radu Horaud},
      title   = {A Geometric Approach to Sound Source Localization from Time-Delay Estimates},
      journal = {{IEEE Transactions on Audio, Speech and Language Processing}},
      volume  = {22},
      number  = {6},
      pages   = {1082--1095},
      year    = {2014},
      doi     = {10.1109/TASLP.2014.2317989},
      arxiv   = {http://arxiv.org/abs/1311.1047},
      soft    = {https://team.inria.fr/perception/the-gtde-matlab-toolbox/},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-TASLP-2014.pdf},
    }

2013

  1. X. Alameda-Pineda, J. Sanchez-Riera, J. Wienke, V. Franc, J. Cech, K. Kulkarni, A. Deleforge, and R. Horaud, “RAVEL: An Annotated Corpus for Training Robots with Audiovisual Abilities,” Journal on Multimodal User Interfaces, vol. 7, iss. 1-2, pp. 79-91, 2013. [ bib pdf data ]
    @article{Alameda-JMUI-2012,
      author  = {Alameda-Pineda, Xavier and Sanchez-Riera, Jordi and Wienke, Johannes and Franc, Vojtech and Cech, Jan and Kulkarni, Kaustubh and Deleforge, Antoine and Horaud, Radu},
      title   = {RAVEL: An Annotated Corpus for Training Robots with Audiovisual Abilities},
      journal = {Journal on Multimodal User Interfaces},
      volume  = {7},
      number  = {1-2},
      pages   = {79--91},
      year    = {2013},
      doi     = {10.1007/s12193-012-0111-y},
      data    = {http://ravel.humavips.eu},
      pdf     = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-JMUI-2012.pdf},
    }

Conferences and Workshops

2020

  1. G. Delorme, Y. Xu, S. Lathuilière, R. Horaud, and X. Alameda-Pineda, “CANU-ReID: A Conditional Adversarial Network for Unsupervised person Re-IDentification,” in IEEE International Conference on Pattern Recognition, 2020. [ bib pdf arxiv ]
    @inproceedings{Delorme-ICPR-2020,
      author    = {Guillaume Delorme and Yihong Xu and St{\'e}phane Lathuili{\`e}re and Radu Horaud and Xavier Alameda-Pineda},
      title     = {CANU-ReID: A Conditional Adversarial Network for Unsupervised person Re-IDentification},
      booktitle = {IEEE International Conference on Pattern Recognition},
      year      = {2020},
      arxiv     = {https://arxiv.org/abs/1904.01308},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Delorme-ICPR-2020.pdf},
    }
  2. S. Leglaive, X. Alameda-Pineda, L. Girin, and R. Horaud, “A Recurrent Variational Autoencoder for Speech Enhancement,” in IEEE International Conference on Acoustics, Speech and Signal Processing, 2020. [ bib pdf arxiv ]
    @inproceedings{Leglaive-ICASSP-2020,
      author    = {Simon Leglaive and Xavier Alameda-Pineda and Laurent Girin and Radu Horaud},
      title     = {A Recurrent Variational Autoencoder for Speech Enhancement},
      booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing},
      year      = {2020},
      arxiv     = {https://arxiv.org/abs/1910.10942},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Leglaive-ICASSP-2020.pdf},
    }
  3. Y. Liu, M. D. Nadai, D. Cai, H. Li, X. Alameda-Pineda, N. Sebe, and B. Lepri, “Describe What to Change: A Text-guided Unsupervised Image-to-image Translation Approach,” in ACM International Conference on Multimedia, 2020. [ bib pdf ]
    @inproceedings{Liu-ACMMM-2020,
      author    = {Yahui Liu and Marco De Nadai and Deng Cai and Huayang Li and Xavier Alameda-Pineda and Nicu Sebe and Bruno Lepri},
      title     = {Describe What to Change: A Text-guided Unsupervised Image-to-image Translation Approach},
      booktitle = {ACM International Conference on Multimedia},
      year      = {2020},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Liu-ACMMM-2020.pdf},
    }
  4. M. Sadeghi and X. Alameda-Pineda, “Robust Unsupervised Audio-visual Speech Enhancement Using a Mixture of Variational Autoencoders,” in IEEE International Conference on Acoustics, Speech and Signal Processing, Barcelona, Spain, 2020. [ bib pdf arxiv ]
    @inproceedings{Sadeghi-ICASSP-2020,
      author    = {Mostafa Sadeghi and Xavier Alameda-Pineda},
      title     = {Robust Unsupervised Audio-visual Speech Enhancement Using a Mixture of Variational Autoencoders},
      booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing},
      address   = {Barcelona, Spain},
      year      = {2020},
      arxiv     = {https://arxiv.org/abs/1911.03930},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Sadeghi-ICASSP-2020.pdf},
    }
  5. Y. Xu, A. Osep, Y. Ban, R. Horaud, L. Leal-Taixé, and X. Alameda-Pineda, “How to Train Your Deep Multi-Object Tracker,” in IEEE International Conference on Computer Vision and Pattern Recognition, Seattle, USA, 2020. [ bib pdf arxiv ]
    @inproceedings{Xu-CVPR-2020,
      author    = {Yihong Xu and Aljosa Osep and Yutong Ban and Radu Horaud and Laura Leal-Taix{\'e} and Xavier Alameda-Pineda},
      title     = {How to Train Your Deep Multi-Object Tracker},
      booktitle = {IEEE International Conference on Computer Vision and Pattern Recognition},
      address   = {Seattle, USA},
      year      = {2020},
      arxiv     = {https://arxiv.org/abs/1906.06618},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Xu-CVPR-2020.pdf},
    }

2019

  1. X. Alameda-Pineda, S. Arias, Y. Ban, G. Delorme, L. Girin, R. Horaud, X. Li, B. Mourgue, and G. Sarrazin, “Audio-Visual Variational Fusion for Multi-Person Tracking with Robots,” in ACM Multimedia, Nice, France, 2019. [ bib pdf ]
    @inproceedings{Alameda-ACMMM-2019,
      author    = {Xavier Alameda-Pineda and Soraya Arias and Yutong Ban and Guillaume Delorme and Laurent Girin and Radu Horaud and Xiaofei Li and Bastien Mourgue and Guillaume Sarrazin},
      title     = {Audio-Visual Variational Fusion for Multi-Person Tracking with Robots},
      booktitle = {ACM Multimedia},
      address   = {Nice, France},
      year      = {2019},
      doi       = {10.1145/3343031.3350590},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-ACMMM-2019.pdf},
    }
  2. X. Alameda-Pineda, M. Redi, E. Celis, N. Sebe, and S. Chang, “FAT/MM’19: 1st International Workshop on Fairness, Accountability, and Transparency in MultiMedia,” in ACM MM, Nice, France, 2019. [ bib pdf ]
    @inproceedings{Alameda-FATMM-2019,
      author    = {Xavier Alameda-Pineda and Miriam Redi and Elisa Celis and Nicu Sebe and Shih-Fu Chang},
      title     = {FAT/MM'19: 1st International Workshop on Fairness, Accountability, and Transparency in MultiMedia},
      booktitle = {ACM MM},
      address   = {Nice, France},
      year      = {2019},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-FATMM-2019.pdf},
    }
  3. M. G. Constantin, B. Ionescu, C. Demarty, N. Q. K. Duong, X. Alameda-Pineda, and M. Sjöberg, “Predicting Media Memorability Task at MediaEval 2019,” in MediaEval 2019 Workshop, 2019. [ bib pdf ]
    @inproceedings{Constantin-MediaEval-2019,
      author    = {Mihai Gabriel Constantin and Bogdan Ionescu and Claire-H{\'e}l{\`e}ne Demarty and Ngoc Q. K. Duong and Xavier Alameda-Pineda and Mats Sj{\"o}berg},
      title     = {Predicting Media Memorability Task at MediaEval 2019},
      booktitle = {MediaEval 2019 Workshop},
      year      = {2019},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Constantin-MediaEval-2019.pdf},
    }

2018

  1. X. Alameda-Pineda, M. Redi, N. Sebe, S. Chang, and J. Luo, “ACM MM’18 Workshop on Understanding Subjective Attributes of Data, Multimodal Recognition of Evoked Emotions,” in ACM International Conference on Multimedia, Seoul, Korea, 2018. [ bib pdf ]
    @inproceedings{Alameda-EEUSAD-2018,
      title     = {ACM MM'18 Workshop on Understanding Subjective Attributes of Data, Multimodal Recognition of Evoked Emotions},
      author    = {Xavier Alameda-Pineda and Miriam Redi and Nicu Sebe and Shih-Fu Chang and Jiebo Luo},
      year      = {2018},
      booktitle = {ACM International Conference on Multimedia},
      address   = {Seoul, Korea},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-EEUSAD-2018.pdf},
    }
  2. Y. Ban, X. Li, X. Alameda-Pineda, L. Girin, and R. Horaud, “Accounting for Room Acoustics in Audio-Visual Multi-Speaker Tracking,” in IEEE International Conference on Acoustics, Speech and Signal Processing, 2018. [ bib pdf ]
    @inproceedings{Ban-ICASSP-2018,
      author    = {Yutong Ban and Xiaofei Li and Xavier Alameda-Pineda and Laurent Girin and Radu Horaud},
      title     = {Accounting for Room Acoustics in Audio-Visual Multi-Speaker Tracking},
      booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing},
      year      = {2018},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Ban-ICASSP-2018.pdf},
    }
  3. S. Lathuilière, P. Mesejo, X. Alameda-Pineda, and R. Horaud, “DeepGUM: Learning Deep Robust Regression with a Gaussian-Uniform Mixture Model,” in European Conference on Computer Vision, Munich, Germany, 2018. [ bib pdf ]
    @inproceedings{lathuiliere-ECCV-2018,
      title     = {DeepGUM: Learning Deep Robust Regression with a Gaussian-Uniform Mixture Model},
      author    = {St\'ephane Lathuili\`ere and Pablo Mesejo and Xavier Alameda-Pineda and Radu Horaud},
      year      = {2018},
      booktitle = {European Conference on Computer Vision},
      address   = {Munich, Germany},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Lathuiliere-ECCV-2018.pdf},
    }
  4. X. Li, Y. Ban, L. Girin, X. Alameda-Pineda, and R. Horaud, “A cascaded multiple-speaker localization and tracking system,” in International Workshop on Acoustic Signal Enhancement (IWAENC), LOCATA Satellite Workshop, Tokyo, Japan, 2018. [ bib pdf ]
    @inproceedings{Li-IWAENC-2018,
      title     = {A cascaded multiple-speaker localization and tracking system},
      author    = {X. Li and Y. Ban and L. Girin and X. Alameda-Pineda and R. Horaud},
      booktitle = {International Workshop on Acoustic Signal Enhancement (IWAENC), LOCATA Satellite Workshop},
      address   = {Tokyo, Japan},
      year      = {2018},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Li-IWAENC-2018.pdf},
    }
  5. W. Wang, X. Alameda-Pineda, D. Xu, E. Ricci, and N. Sebe, “Every Smile is Unique: Landmark-Guided Diverse Smile Generation,” in IEEE International Conference on Computer Vision and Pattern Recognition, Salt Lake City, USA, 2018. [ bib pdf arxiv ]
    @inproceedings{Wang-CVPR-2018,
      author    = {Wang, Wei and Alameda-Pineda, Xavier and Xu, Dan and Ricci, Elisa and Sebe, Nicu},
      title     = {Every Smile is Unique: Landmark-Guided Diverse Smile Generation},
      booktitle = {IEEE International Conference on Computer Vision and Pattern Recognition},
      address   = {Salt Lake City, USA},
      year      = {2018},
      arxiv     = {http://arxiv.org/abs/1802.01873},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Wang-CVPR-2018.pdf},
    }

2017

  1. X. Alameda-Pineda, A. Pilzer, D. Xu, N. Sebe, and E. Ricci, “Viraliency: Pooling Local Virality,” in IEEE International Conference on Computer Vision and Pattern Recognition, Hawaii, USA, 2017. [ bib pdf code arxiv ]
    @inproceedings{Alameda-CVPR-2017,
      author    = {Xavier Alameda-Pineda and Andrea Pilzer and Dan Xu and Nicu Sebe and Elisa Ricci},
      title     = {Viraliency: Pooling Local Virality},
      booktitle = {IEEE International Conference on Computer Vision and Pattern Recognition},
      address   = {Hawaii, USA},
      year      = {2017},
      doi       = {10.1109/CVPR.2017.59},
      arxiv     = {https://arxiv.org/abs/1703.03937},
      soft      = {https://github.com/xavirema/lena_pooling},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-CVPR-2017.pdf},
    }
  2. X. Alameda-Pineda, M. Redi, M. Soleymani, N. Sebe, S. Chang, and S. Gosling, “MUSA2 — First ACM Workshop on Multimodal Understanding of Social, Affective and Subjective Attributes,” in ACM Multimedia, Mountain View, USA, 2017. [ bib pdf ]
    @inproceedings{Alameda-MUSA2-2017,
      title={MUSA2 -- First ACM Workshop on Multimodal Understanding of Social, Affective and Subjective Attributes},
      author={Xavier Alameda-Pineda and Miriam Redi and Mohammad Soleymani and Nicu Sebe and Shih-Fu Chang and Samuel Gosling},
      booktitle={ACM Multimedia},
      address={Mountain View, USA},
      year={2017},
      doi={10.1145/3123266.3132057},
      pdf={http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-MUSA2-2017.pdf},
    }
  3. Y. Ban, L. Girin, X. Alameda-Pineda, and R. Horaud, “Exploiting the Complementarity of Audio-Visual Data for Probabilistic Multi-Speaker Tracking,” in IEEE ICCV Workshop on Computer Vision for Audio-Visual Media, Venice, Italy, 2017. [ bib pdf ]
    @inproceedings{Ban-CVAVM-2017,
      title={Exploiting the Complementarity of Audio-Visual Data for Probabilistic Multi-Speaker Tracking},
      author={Yutong Ban and Laurent Girin and Xavier Alameda-Pineda and Radu Horaud},
      booktitle={IEEE ICCV Workshop on Computer Vision for Audio-Visual Media},
      address={Venice, Italy},
      year={2017},
      pdf={http://xavirema.eu/wp-content/papercite-data/pdf/Ban-CVAVM-2017.pdf},
    }
  4. Y. Ban, X. Alameda-Pineda, F. Badeig, S. Ba, and R. Horaud, “Tracking a Varying Number of People with a Visually-Controlled Robotic Head,” in Intelligent Robots and Systems, Vancouver, Canada, 2017. [ bib pdf ]
    Award Novel Technology Paper Award Finalist
    @inproceedings{Ban-IROS-2017,
      author    = {Yutong Ban and Xavier Alameda-Pineda and Fabien Badeig and Sileye Ba and Radu Horaud},
      title     = {Tracking a Varying Number of People with a Visually-Controlled Robotic Head},
      booktitle = {Intelligent Robots and Systems},
      address   = {Vancouver, Canada},
      year      = {2017},
      award     = {Novel Technology Paper Award Finalist},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Ban-IROS-2017.pdf},
    }
  5. L. Girin, T. Hueber, and X. Alameda-Pineda, “Adaptation of a Gaussian Mixture Regressor to a New Input Distribution: Extending the C-GMR Framework,” in International Conference on Latent Variable Analysis and Signal Separation, Grenoble, France, 2017. [ bib pdf ]
    @inproceedings{Girin-LVA-2017,
      author    = {Laurent Girin and Thomas Hueber and Xavier Alameda-Pineda},
      title     = {Adaptation of a {Gaussian} Mixture Regressor to a New Input Distribution: Extending the {C-GMR} Framework},
      booktitle = {International Conference on Latent Variable Analysis and Signal Separation},
      year      = {2017},
      address   = {Grenoble, France},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Girin-LVA-2017.pdf}
    }
  6. D. Kounades-Bastian, L. Girin, X. Alameda-Pineda, R. Horaud, and S. Gannot, “Exploiting the Intermittency of Speech for Joint Separation and Diarization,” in IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, New Paltz, USA, 2017. [ bib pdf ]
    @inproceedings{Kounades-WASPAA-2017,
      author    = {Dionyssos Kounades-Bastian and Laurent Girin and Xavier Alameda-Pineda and Radu Horaud and Sharon Gannot},
      title     = {Exploiting the Intermittency of Speech for Joint Separation and Diarization},
      booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics},
      year      = {2017},
      address   = {New Paltz, USA},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Kounades-WASPAA-2017.pdf}
    }
  7. A. Siarohin, G. Zen, C. Majtanovic, X. Alameda-Pineda, E. Ricci, and N. Sebe, “How to Make an Image More Memorable? A Deep Style Transfer Approach,” in ACM International Conference on Multimedia Retrieval, Bucharest, Romania, 2017. [ bib pdf ]
    @inproceedings{Siarohin-ICMR-2017,
      title     = {How to Make an Image More Memorable? A Deep Style Transfer Approach},
      author    = {Aliaksandr Siarohin and Gloria Zen and Cveta Majtanovic and Xavier Alameda-Pineda and Elisa Ricci and Nicu Sebe},
      booktitle = {ACM International Conference on Multimedia Retrieval},
      address   = {Bucharest, Romania},
      year      = {2017},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Siarohin-ICMR-2017.pdf}
    }
  8. D. Xu, W. Ouyang, X. Alameda-Pineda, E. Ricci, X. Wang, and N. Sebe, “Learning Deep Structured Multi-Scale Features using Attention-Gated CRFs for Contour Prediction,” in Advances in Neural Information Processing Systems, Long Beach, USA, 2017. [ bib pdf ]
    @inproceedings{Xu-NIPS-2017,
      author    = {Dan Xu and Wanli Ouyang and Xavier Alameda-Pineda and Elisa Ricci and Xiaogang Wang and Nicu Sebe},
      title     = {Learning Deep Structured Multi-Scale Features using Attention-Gated {CRFs} for Contour Prediction},
      booktitle = {Advances in Neural Information Processing Systems},
      year      = {2017},
      address   = {Long Beach, USA},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Xu-NIPS-2017.pdf}
    }
  9. D. Kounades-Bastian, L. Girin, X. Alameda-Pineda, S. Gannot, and R. Horaud, “An EM algorithm for joint source separation and diarisation of multichannel convolutive mixtures,” in IEEE International Conference on Acoustics, Speech and Signal Processing, New Orleans, USA, 2017. [ bib pdf ]
    @inproceedings{Kounades-ICASSP-2017,
      author    = {Dionyssos Kounades-Bastian and Laurent Girin and Xavier Alameda-Pineda and Sharon Gannot and Radu Horaud},
      title     = {An {EM} algorithm for joint source separation and diarisation of multichannel convolutive mixtures},
      booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing},
      year      = {2017},
      address   = {New Orleans, USA},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Kounades-ICASSP-2017.pdf}
    }

2016

  1. X. Alameda-Pineda, E. Ricci, Y. Yan, and N. Sebe, “Recognizing Emotions from Abstract Paintings using Non-Linear Matrix Completion,” in IEEE International Conference on Computer Vision and Pattern Recognition, Las Vegas, USA, 2016. [ bib pdf code ]
    @inproceedings{Alameda-CVPR-2016,
      title     = {Recognizing Emotions from Abstract Paintings using Non-Linear Matrix Completion},
      author    = {Xavier Alameda-Pineda and Elisa Ricci and Yan Yan and Nicu Sebe},
      booktitle = {IEEE International Conference on Computer Vision and Pattern Recognition},
      address   = {Las Vegas, USA},
      year      = {2016},
      soft      = {https://github.com/xavirema/nlmc},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-CVPR-2016.pdf}
    }
  2. Y. Ban, S. Ba, X. Alameda-Pineda, and R. Horaud, “Tracking Multiple Persons Based on a Variational Bayesian Model,” in European Conference on Computer Vision Workshops, Amsterdam, The Netherlands, 2016, pp. 52-67. [ bib pdf ]
    @inproceedings{Ban-ECCVW-2016,
      author    = {Ban, Yutong and Ba, Sileye and Alameda-Pineda, Xavier and Horaud, Radu},
      title     = {Tracking Multiple Persons Based on a Variational {Bayesian} Model},
      booktitle = {European Conference on Computer Vision Workshops},
      year      = {2016},
      pages     = {52--67},
      address   = {Amsterdam, The Netherlands},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Ban-ECCVW-2016.pdf}
    }
  3. D. Kounades-Bastian, L. Girin, X. Alameda-Pineda, S. Gannot, and R. Horaud, “An inverse-gamma source variance prior with factorized parametrization for audio source separation,” in IEEE International Conference on Acoustics, Speech and Signal Processing, Shanghai, China, 2016, pp. 136-140. [ bib pdf ]
    @inproceedings{Kounades-ICASSP-2016,
      author    = {Kounades-Bastian, Dionyssos and Girin, Laurent and Alameda-Pineda, Xavier and Gannot, Sharon and Horaud, Radu},
      title     = {An inverse-gamma source variance prior with factorized parametrization for audio source separation},
      booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing},
      year      = {2016},
      pages     = {136--140},
      address   = {Shanghai, China},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Kounades-ICASSP-2016.pdf}
    }
  4. S. Tulyakov, X. Alameda-Pineda, E. Ricci, L. Yin, J. F. Cohn, and N. Sebe, “Self-Adaptive Matrix Completion for Heart Rate Estimation from Face Videos under Realistic Conditions,” in IEEE International Conference on Computer Vision and Pattern Recognition, Las Vegas, USA, 2016. [ bib pdf ]
    @inproceedings{Tulyakov-CVPR-2016,
      title     = {Self-Adaptive Matrix Completion for Heart Rate Estimation from Face Videos under Realistic Conditions},
      author    = {Sergey Tulyakov and Xavier Alameda-Pineda and Elisa Ricci and Lijun Yin and Jeffrey F. Cohn and Nicu Sebe},
      booktitle = {IEEE International Conference on Computer Vision and Pattern Recognition},
      address   = {Las Vegas, USA},
      year      = {2016},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Tulyakov-CVPR-2016.pdf}
    }
  5. W. Wang, Y. Yan, F. Nie, X. Alameda-Pineda, S. Yan, and N. Sebe, “Projective Unsupervised Flexible Embedding with Optimal Graph,” in British Machine Vision Conference, York, United Kingdom, 2016. [ bib pdf ]
    @inproceedings{Wang-BMVC-2016,
      author    = {Wei Wang and Yan Yan and Feiping Nie and Xavier Alameda-Pineda and Shuicheng Yan and Nicu Sebe},
      title     = {Projective Unsupervised Flexible Embedding with Optimal Graph},
      booktitle = {British Machine Vision Conference},
      address   = {York, United Kingdom},
      year      = {2016},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Wang-BMVC-2016.pdf}
    }
  6. D. Xu, X. Alameda-Pineda, J. Song, E. Ricci, and N. Sebe, “Academic Coupled Dictionary Learning for Sketch-based Image Retrieval,” in ACM International Conference on Multimedia, Amsterdam, The Netherlands, 2016. [ bib pdf ]
    @inproceedings{Xu-ACMMM-2016,
      author    = {Dan Xu and Xavier Alameda-Pineda and Jingkuan Song and Elisa Ricci and Nicu Sebe},
      title     = {Academic Coupled Dictionary Learning for Sketch-based Image Retrieval},
      booktitle = {ACM International Conference on Multimedia},
      address   = {Amsterdam, The Netherlands},
      year      = {2016},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Xu-ACMMM-2016.pdf}
    }
  7. D. Xu, J. Song, X. Alameda-Pineda, E. Ricci, and N. Sebe, “Multi-Paced Dictionary Learning for Cross-Domain Retrieval and Recognition,” in IEEE International Conference on Pattern Recognition, Cancun, Mexico, 2016. [ bib pdf ]
    Award Best Intel Scientific Award
    @inproceedings{Xu-ICPR-2016,
      author    = {Dan Xu and Jingkuan Song and Xavier Alameda-Pineda and Elisa Ricci and Nicu Sebe},
      title     = {Multi-Paced Dictionary Learning for Cross-Domain Retrieval and Recognition},
      booktitle = {IEEE International Conference on Pattern Recognition},
      address   = {Cancun, Mexico},
      year      = {2016},
      award     = {Best Intel Scientific Award},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Xu-ICPR-2016.pdf}
    }

2015

  1. X. Alameda-Pineda, Y. Yan, E. Ricci, O. Lanz, and N. Sebe, “Analyzing Free-standing Conversational Groups: A Multimodal Approach,” in ACM International Conference on Multimedia, Brisbane, Australia, 2015, pp. 4-15. [ bib pdf ]
    Award Best Paper Award
    @inproceedings{Alameda-ACMMM-2015,
      title     = {Analyzing Free-standing Conversational Groups: A Multimodal Approach},
      author    = {Xavier Alameda-Pineda and Yan Yan and Elisa Ricci and Oswald Lanz and Nicu Sebe},
      booktitle = {ACM International Conference on Multimedia},
      address   = {Brisbane, Australia},
      pages     = {4--15},
      year      = {2015},
      award     = {Best Paper Award},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-ACMMM-2015.pdf}
    }
  2. D. Kounades-Bastian, L. Girin, X. Alameda-Pineda, S. Gannot, and R. Horaud, “A Variational EM Algorithm for the Separation of Moving Sound Sources,” in IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, New Paltz, USA, 2015, pp. 1-5. [ bib pdf ]
    Award Best Student Paper Award
    @inproceedings{Kounades-WASPAA-2015,
      author    = {Kounades-Bastian, Dionyssos and Girin, Laurent and Alameda-Pineda, Xavier and Gannot, Sharon and Horaud, Radu},
      title     = {A Variational {EM} Algorithm for the Separation of Moving Sound Sources},
      booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics},
      year      = {2015},
      pages     = {1--5},
      address   = {New Paltz, USA},
      award     = {Best Student Paper Award},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Kounades-WASPAA-2015.pdf}
    }

2014

  1. I. Gebru, X. Alameda-Pineda, R. Horaud, and F. Forbes, “Audio-Visual Speaker Localization via Weighted Clustering,” in IEEE Workshop on Machine Learning for Signal Processing, Reims, France, 2014, pp. 1-6. [ bib pdf ]
    @inproceedings{Gebru-MLSP-2014,
      author    = {Gebru, Israel-Dejene and Alameda-Pineda, Xavier and Horaud, Radu and Forbes, Florence},
      title     = {Audio-Visual Speaker Localization via Weighted Clustering},
      booktitle = {IEEE Workshop on Machine Learning for Signal Processing},
      year      = {2014},
      pages     = {1--6},
      address   = {Reims, France},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Gebru-MLSP-2014.pdf}
    }
  2. M. Janvier, X. Alameda-Pineda, L. Girin, and R. Horaud, “Sound Representation and Classification Benchmark for Domestic Robots,” in IEEE International Conference on Robotics and Automation, Hong Kong, China, 2014, pp. 6285-6292. [ bib pdf arxiv ]
    @inproceedings{Janvier-ICRA-2014,
      author    = {Janvier, Maxime and Alameda-Pineda, Xavier and Girin, Laurent and Horaud, Radu},
      title     = {Sound Representation and Classification Benchmark for Domestic Robots},
      booktitle = {IEEE International Conference on Robotics and Automation},
      year      = {2014},
      pages     = {6285--6292},
      address   = {Hong Kong, China},
      arxiv     = {https://arxiv.org/abs/1402.3689},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Janvier-ICRA-2014.pdf}
    }

2013

  1. X. Alameda-Pineda, J. Sanchez-Riera, and R. Horaud, “Benchmarking Methods for Audio-Visual Recognition Using Tiny Training Sets,” in IEEE International Conference on Acoustics, Speech, and Signal Processing, Vancouver, Canada, 2013, pp. 3662-3666. [ bib pdf ]
    @Inproceedings{Alameda-ICASSP-2013,
      author    = {Alameda-Pineda, Xavier and Sanchez-Riera, Jordi and Horaud, Radu},
      title     = {Benchmarking Methods for Audio-Visual Recognition Using Tiny Training Sets},
      booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
      year      = {2013},
      pages     = {3662--3666},
      address   = {Vancouver, Canada},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-ICASSP-2013.pdf}
    }
  2. X. Alameda-Pineda, R. Horaud, and B. Mourrain, “The Geometry of Sound Source Localization Using Non-Coplanar Microphone Arrays,” in IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, New Paltz, USA, 2013, pp. 1-4. [ bib pdf code ]
    @inproceedings{Alameda-WASPAA-2013,
      title     = {The Geometry of Sound Source Localization Using Non-Coplanar Microphone Arrays},
      author    = {Xavier Alameda-Pineda and Radu Horaud and Bernard Mourrain},
      booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics},
      address   = {New Paltz, USA},
      pages     = {1--4},
      year      = {2013},
      soft      = {https://team.inria.fr/perception/the-gtde-matlab-toolbox/},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-WASPAA-2013.pdf}
    }
  3. J. Cech, R. Mittal, A. Deleforge, J. Sanchez-Riera, X. Alameda-Pineda, and R. Horaud, “Active-Speaker Detection and Localization with Microphones and Cameras Embedded into a Robotic Head,” in IEEE-RAS International Conference on Humanoid Robots, Atlanta, USA, 2013, pp. 203-210. [ bib pdf ]
    @inproceedings{Cech-Humanoids-2013,
      author    = {Cech, Jan and Mittal, Ravi and Deleforge, Antoine and Sanchez-Riera, Jordi and Alameda-Pineda, Xavier and Horaud, Radu},
      title     = {Active-Speaker Detection and Localization with Microphones and Cameras Embedded into a Robotic Head},
      booktitle = {IEEE-RAS International Conference on Humanoid Robots},
      year      = {2013},
      pages     = {203--210},
      address   = {Atlanta, USA},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Cech-Humanoids-2013.pdf}
    }

2012

  1. X. Alameda-Pineda and R. Horaud, “Geometrically-constrained Robust Time Delay Estimation Using Non-coplanar Microphone Arrays,” in European Signal Processing Conference, Bucharest, Romania, 2012, pp. 1309-1313. [ bib pdf code ]
    @InProceedings{Alameda-EUSIPCO-2012,
      author    = {Alameda-Pineda, Xavier and Horaud, Radu},
      title     = {Geometrically-constrained Robust Time Delay Estimation Using Non-coplanar Microphone Arrays},
      booktitle = {European Signal Processing Conference},
      year      = {2012},
      pages     = {1309--1313},
      address   = {Bucharest, Romania},
      soft      = {https://team.inria.fr/perception/the-gtde-matlab-toolbox/},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-EUSIPCO-2012.pdf}
    }
  2. M. Janvier, X. Alameda-Pineda, L. Girin, and R. Horaud, “Sound-Event Recognition with a Companion Humanoid,” in IEEE-RAS International Conference on Humanoid Robots, Osaka, Japan, 2012, pp. 104-111. [ bib pdf ]
    @InProceedings{Janvier-Humanoids-2012,
      author    = {Janvier, Maxime and Alameda-Pineda, Xavier and Girin, Laurent and Horaud, Radu},
      title     = {Sound-Event Recognition with a Companion Humanoid},
      booktitle = {IEEE-RAS International Conference on Humanoid Robots},
      year      = {2012},
      pages     = {104--111},
      address   = {Osaka, Japan},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Janvier-Humanoids-2012.pdf}
    }
  3. J. Sanchez-Riera, X. Alameda-Pineda, J. Wienke, A. Deleforge, S. Arias, J. Cech, S. Wrede, and R. Horaud, “Online Multimodal Speaker Detection for Humanoid Robots,” in IEEE-RAS International Conference on Humanoid Robots, Osaka, Japan, 2012, pp. 126-133. [ bib pdf code ]
    @InProceedings{Sanchez-Humanoids-2012,
      author    = {Sanchez-Riera, Jordi and Alameda-Pineda, Xavier and Wienke, Johannes and Deleforge, Antoine and Arias, Soraya and Cech, Jan and Wrede, Sebastian and Horaud, Radu},
      title     = {Online Multimodal Speaker Detection for Humanoid Robots},
      booktitle = {IEEE-RAS International Conference on Humanoid Robots},
      year      = {2012},
      pages     = {126--133},
      address   = {Osaka, Japan},
      soft      = {http://code.humavips.eu},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Sanchez-Humanoids-2012.pdf}
    }
  4. J. Sanchez-Riera, X. Alameda-Pineda, and R. Horaud, “Audio-Visual Robot Command Recognition,” in IEEE/ACM International Conference on Multimodal Interaction, Santa Monica, USA, 2012, pp. 371-378. [ bib pdf ]
    @InProceedings{Sanchez-ICMI-2012,
      title     = {Audio-Visual Robot Command Recognition},
      author    = {Sanchez-Riera, Jordi and Alameda-Pineda, Xavier and Horaud, Radu},
      booktitle = {IEEE/ACM International Conference on Multimodal Interaction},
      pages     = {371--378},
      address   = {Santa Monica, USA},
      year      = {2012},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Sanchez-ICMI-2012.pdf}
    }

2011

  1. X. Alameda-Pineda, V. Khalidov, R. Horaud, and F. Forbes, “Finding Audio-Visual Events in Informal Social Gatherings,” in IEEE/ACM International Conference on Multimodal Interfaces, Alicante, Spain, 2011, pp. 247-254. [ bib pdf code ]
    Award Outstanding Paper Award
    @InProceedings{Alameda-ICMI-2011,
      author    = {Alameda-Pineda, Xavier and Khalidov, Vasil and Horaud, Radu and Forbes, Florence},
      title     = {Finding Audio-Visual Events in Informal Social Gatherings},
      booktitle = {IEEE/ACM International Conference on Multimodal Interfaces},
      year      = {2011},
      pages     = {247--254},
      address   = {Alicante, Spain},
      award     = {Outstanding Paper Award},
      soft      = {https://code.humavips.eu},
      pdf       = {http://xavirema.eu/wp-content/papercite-data/pdf/Alameda-ICMI-2011.pdf}
    }

2008

  1. J. C. Rolon, P. Salembier, and X. Alameda-Pineda, “Image Compression with Generalized Lifting and partial knowledge of the signal PDF,” in IEEE International Conference on Image Processing, San Diego, USA, 2008, pp. 129-132. [ bib ]
    @InProceedings{Rolon-ICIP-2008,
      author    = {Rolon, Julio C. and Salembier, Philippe and Alameda-Pineda, Xavier},
      title     = {Image Compression with Generalized Lifting and partial knowledge of the signal {PDF}},
      booktitle = {IEEE International Conference on Image Processing},
      year      = {2008},
      pages     = {129--132},
      address   = {San Diego, USA},
    }