Research

Vision & Language

  1. ReGen: A good Generative zero-shot video classifier should be Rewarded. bibtex A. Bulat, E. Sanchez-Lozano, B. Martinez, G. Tzimiropoulos. In International Conference on Computer Vision (ICCV), 2023.
    @inproceedings{bulat_iccv23a,
      author    = {A. Bulat and E. Sanchez-Lozano and B. Martinez and G. Tzimiropoulos},
      title     = {{ReGen}: A good Generative zero-shot video classifier should be Rewarded},
      booktitle = {International Conference on Computer Vision (ICCV)},
      year      = {2023},
    }
  2. Black Box Few-Shot Adaptation for Vision-Language models. bibtex link Y. Ouali, A. Bulat, B. Martinez, G. Tzimiropoulos. In International Conference on Computer Vision (ICCV), 2023.
    @inproceedings{yassine_iccv23,
      author    = {Y. Ouali and A. Bulat and B. Martinez and G. Tzimiropoulos},
      title     = {Black Box Few-Shot Adaptation for Vision-Language models},
      booktitle = {International Conference on Computer Vision (ICCV)},
      year      = {2023},
      url       = {https://arxiv.org/abs/2304.01752},
    }
  3. Bayesian Prompt Learning for Image-Language Model Generalization. bibtex link M. Derakhshani, E. Sanchez, A. Bulat, V. Turrisi da Costa, C. Snoek, G. Tzimiropoulos, B. Martinez. In International Conference on Computer Vision (ICCV), 2023.
    @inproceedings{derakhshani_iccv23,
      author    = {M. Derakhshani and E. Sanchez and A. Bulat and Turrisi da Costa, V. and C. Snoek and G. Tzimiropoulos and B. Martinez},
      title     = {{Bayesian} Prompt Learning for Image-Language Model Generalization},
      booktitle = {International Conference on Computer Vision (ICCV)},
      year      = {2023},
      url       = {https://arxiv.org/abs/2210.02390},
    }

Action recognition

  1. Few-shot Action Recognition with Prototype-centered Attentive Learning. bibtex J.M. Pérez-Rúa, B. Martinez, X. Zhu, A. Toisoul, V. Escorcia, T. Xiang. In British Machine Vision Conference (BMVC), 2021.
    @inproceedings{w3_CVPR21,
      author    = {J. M. P{\'e}rez-R{\'u}a and B. Martinez and X. Zhu and A. Toisoul and V. Escorcia and T. Xiang},
      title     = {Few-shot Action Recognition with Prototype-centered Attentive Learning},
      booktitle = {British Machine Vision Conference (BMVC)},
      year      = {2021},
    }
  2. Egocentric Action Recognition by Video Attention and Temporal Context. bibtex link J. Perez-Rua and A. Toisoul and B. Martinez and V. Escorcia and L. Zhang and X. Zhu and T. Xiang. In EPIC-Kitchens challenge, CVPR Workshops, 2020.
    @inproceedings{perezrua_cvprw20,
      author    = {J. Perez-Rua and A. Toisoul and B. Martinez and V. Escorcia and L. Zhang and X. Zhu and T. Xiang},
      title     = {Egocentric Action Recognition by Video Attention and Temporal Context},
      booktitle = {EPIC-Kitchens challenge, CVPR Workshops},
      year      = {2020},
      url       = {https://arxiv.org/abs/2007.01883},
    }
  3. Knowing What, Where and When to Look: Efficient Video Action Modeling with Attention. bibtex link J. Perez-Rua and B. Martinez and X. Zhu and A. Toisoul and V. Escorcia and T. Xiang. In British Machine Vision Conference (BMVC), 2021.
    @inproceedings{perezrua_arxiv20,
      author    = {J. Perez-Rua and B. Martinez and X. Zhu and A. Toisoul and V. Escorcia and T. Xiang},
      title     = {Knowing What, Where and When to Look: Efficient Video Action Modeling with Attention},
      booktitle = {British Machine Vision Conference (BMVC)},
      year      = {2021},
      url       = {https://arxiv.org/abs/2004.01278},
    }
  4. Action Recognition With Spatial-Temporal Discriminative Filter Banks. bibtex B. Martinez, D. Modolo, Y. Xiong, and J. Tighe. In IEEE International Conference on Computer Vision (ICCV), 2019.
    @inproceedings{Martinez_2019_ICCV,
      author    = {B. Martinez and D. Modolo and Y. Xiong and J. Tighe},
      title     = {Action Recognition With Spatial-Temporal Discriminative Filter Banks},
      booktitle = {IEEE International Conference on Computer Vision (ICCV)},
      year      = {2019},
    }

Binary Neural Networks

  1. High-Capacity Expert Binary Networks. bibtex A. Bulat, B. Martinez, G. Tzimiropoulos. In International Conference on Learning Representations (ICLR), 2021.
    @inproceedings{bulat_iclr21,
      author    = {A. Bulat and B. Martinez and G. Tzimiropoulos},
      title     = {High-Capacity Expert Binary Networks},
      booktitle = {International Conference on Learning Representations (ICLR)},
      year      = {2021},
    }
    
  2. BATS: Binary ArchitecTure Search. bibtex A. Bulat and B. Martinez and G. Tzimiropoulos. In European Conf. on Computer Vision (ECCV), 2020.
    @inproceedings{adrian_eccv20,
      author    = {A. Bulat and B. Martinez and G. Tzimiropoulos},
      title     = {{BATS}: Binary {ArchitecTure} Search},
      booktitle = {European Conf. on Computer Vision (ECCV)},
      year      = {2020},
    }
  3. Training binary neural networks with real-to-binary convolutions. bibtex B. Martinez, J. Yang, A. Bulat, and Y. Tzimiropoulos. In International Conference on Learning Representations (ICLR), 2020.
    @inproceedings{Martinez_2020ICLR,
      author    = {B. Martinez and J. Yang and A. Bulat and Y. Tzimiropoulos},
      title     = {Training binary neural networks with real-to-binary convolutions},
      booktitle = {International Conference on Learning Representations (ICLR)},
      year      = {2020},
    }

Lipreading

  1. Towards practical lipreading with distilled and efficient models. pdf bibtex P. Ma*, B. Martinez*, S. Petridis, M. Pantic. In Int’l Conf. on Acoustics, Speech, and Signal Processing (ICASSP), 2021.
    @inproceedings{jing_eccv20,
      author        = {P. Ma and B. Martinez and S. Petridis and M. Pantic},
      title         = {Towards practical lipreading with distilled and efficient models},
      booktitle     = {International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
      year          = {2021},
      internal-note = {P. Ma and B. Martinez were each marked with an asterisk in the original author list (presumably equal contribution -- confirm); the markers were moved here so the names parse correctly},
    }
  2. Lipreading using Temporal Convolutional Networks. bibtex B. Martinez, P. Ma, S. Petridis, M. Pantic. In International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2020.
    @inproceedings{Martinez_2020ICASSP,
        author    = {B. Martinez and P. Ma and S. Petridis and M. Pantic},
        title     = {Lipreading using Temporal Convolutional Networks},
        booktitle = {International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
        year      = {2020},
    }

Knowledge Distillation

  1. Knowledge distillation via softmax regression representation learning. bibtex link J. Yang, B. Martinez, A. Bulat, G. Tzimiropoulos. In International Conference on Learning Representations (ICLR), 2021.
    @inproceedings{jang_iclr21,
      author    = {J. Yang and B. Martinez and A. Bulat and G. Tzimiropoulos},
      title     = {Knowledge distillation via softmax regression representation learning},
      booktitle = {International Conference on Learning Representations (ICLR)},
      year      = {2021},
      url       = {https://github.com/jingyang2017/KD_SRRL},
    }