I am a PhD student, currently affiliated with the Computer Vision Group at the University of Bonn, Germany. I am supervised by Professor Dr. Jürgen Gall, and am working in the domain of Long-Term Multimodal Video Understanding.
Previously I was an Associate Researcher in computer vision, affiliated with the Intelligent Visual Analytics Lab (IVAL) at the Mohamed Bin Zayed University of Artificial Intelligence (MBZUAI). I was supervised by Dr. Salman Khan.
I completed my master’s degree in Image Processing and Computer Vision (IPCV), funded by the Erasmus Mundus Joint Master’s Degree (EMJMD) scholarship program. During the master’s program, I was fortunate to intern at the Empathic Computing Lab, supervised by Dr. Mark Billinghurst. I completed my master’s thesis in the CVLAB at EPFL, supervised by Dr. Mathieu Salzmann.
I hold an undergraduate degree in Electrical Engineering, with a minor in computer science, from Habib University in Karachi, Pakistan.
My previous website, which lists my high-school, undergraduate, and graduate courses and projects, can be found at talalwasim.weebly.com.
% Video-Panda: conference paper, CVPR 2025.
% NOTE(review): the trailing "*" on author names is kept verbatim; presumably it marks equal contribution -- confirm.
@inproceedings{yi2024vpanda,
  author    = {Jinhui Yi* and Syed Talal Wasim* and Yanan Luo* and Muzammal Naseer and Juergen Gall},
  title     = {{Video-Panda}: Parameter-efficient Alignment for Encoder-free Video-Language Models},
  booktitle = {CVPR},
  year      = {2025},
}
% GroupMamba: conference paper, CVPR 2025.
% The model name is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{shaker2024groupmamba,
  author    = {Abdelrahman Shaker and Syed Talal Wasim and Salman Khan and Juergen Gall and Fahad Shahbaz Khan},
  title     = {{GroupMamba}: Parameter-Efficient and Accurate Group Visual State Space Model},
  booktitle = {CVPR},
  year      = {2025},
}
% STING-BEE: conference paper, CVPR 2025.
% The acronym and "X-ray" are brace-protected so sentence-casing styles keep their capitalisation.
@inproceedings{velayudhan2024sting,
  author    = {Divya Velayudhan and Abdelfatah Ahmed and Mohamad Alansari and Neha Gour and Abderaouf Behouch and Taimur Hassan and Syed Talal Wasim and Nabil Maalej and Muzammal Naseer and Juergen Gall and Mohammed Bennamoun and Ernesto Damiani and Naoufel Werghi},
  title     = {{STING-BEE}: Towards Vision-Language Model for Real-World {X-ray} Baggage Security Inspection},
  booktitle = {CVPR},
  year      = {2025},
}
% Efficient video object segmentation with modulated cross-attention memory: conference paper, WACV 2025.
@inproceedings{shaker2025mavos,
  author    = {Abdelrahman Shaker and Syed Talal Wasim and Martin Danelljan and Salman Khan and Ming-Hsuan Yang and Fahad Shahbaz Khan},
  title     = {Efficient Video Object Segmentation via Modulated Cross-Attention Memory},
  booktitle = {WACV},
  year      = {2025},
}
% arXiv preprint (2024). The arXiv identifier lives in the eprint fields instead of a journal field.
% NOTE(review): the trailing "*" on author names is kept verbatim; presumably it marks equal contribution -- confirm.
@misc{suleman2024stablemamba,
  author        = {Hamid Suleman* and Syed Talal Wasim* and Muzammal Naseer and Juergen Gall},
  title         = {Distillation-free Scaling of Large {SSMs} for Images and Videos},
  year          = {2024},
  eprint        = {2409.11867},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2409.11867},
}
% Video-GroundingDINO: conference paper, CVPR 2024.
% The model name is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{wasim2024vgdino,
  author    = {Syed Talal Wasim and Muzammal Naseer and Salman Khan and Ming-Hsuan Yang and Fahad Shahbaz Khan},
  title     = {{Video-GroundingDINO}: Towards Open-Vocabulary Spatio-Temporal Video Grounding},
  booktitle = {CVPR},
  year      = {2024},
}
% AR-VPT: conference paper, VISAPP 2024.
% The acronyms are brace-protected so sentence-casing styles keep their capitalisation.
@inproceedings{yousuf2024arvpt,
  author    = {Muhammad Zain Yousuf and Syed Talal Wasim and Syed Nouman Hasany and Muhammad Farhan},
  title     = {{AR-VPT}: Simple Auto-Regressive Prompts for Adapting Frozen {ViTs} to Videos},
  booktitle = {VISAPP},
  year      = {2024},
}
% Hardware resilience of text-guided image classifiers: conference paper, NeurIPS 2023.
@inproceedings{wasim2023textres,
  author    = {Syed Talal Wasim and Kabila Haile Soboka and Abdulrahman Mahmoud and Salman Khan and David Brooks and Gu-Yeon Wei},
  title     = {Hardware Resilience Properties of Text-Guided Image Classifiers},
  booktitle = {NeurIPS},
  year      = {2023},
}
% Video-FocalNets: conference paper, ICCV 2023.
% NOTE(review): the trailing "*" on author names is kept verbatim; presumably it marks equal contribution -- confirm.
@inproceedings{wasim2023vfn,
  author    = {Syed Talal Wasim* and Muhammad Uzair Khattak* and Muzammal Naseer and Salman Khan and Mubarak Shah and Fahad Shahbaz Khan},
  title     = {{Video-FocalNets}: Spatio-Temporal Focal Modulation for Video Action Recognition},
  booktitle = {ICCV},
  year      = {2023},
}
% Self-regulating prompts: conference paper, ICCV 2023.
% NOTE(review): the trailing "*" on author names is kept verbatim; presumably it marks equal contribution -- confirm.
@inproceedings{khattak2023promptsrc,
  author    = {Muhammad Uzair Khattak* and Syed Talal Wasim* and Muzammal Naseer and Salman Khan and Ming-Hsuan Yang and Fahad Shahbaz Khan},
  title     = {Self-regulating Prompts: Foundational Model Adaptation without Forgetting},
  booktitle = {ICCV},
  year      = {2023},
}
% Vita-CLIP: conference paper, CVPR 2023.
% The model names are brace-protected so sentence-casing styles keep their capitalisation.
@inproceedings{wasim2023vita,
  author    = {Syed Talal Wasim and Muzammal Naseer and Salman Khan and Fahad Shahbaz Khan and Mubarak Shah},
  title     = {{Vita-CLIP}: Video and text adaptive {CLIP} via Multimodal Prompting},
  booktitle = {CVPR},
  year      = {2023},
}
% Automatic typography analysis (serif classification, font similarity): journal article, JDMDH 2023.
@article{wasim2023gest,
  author  = {Syed Talal Wasim and Romain Collaud and Lara Défayes and Nicolas Henchoz and Mathieu Salzmann and Delphine Ribes},
  title   = {Toward automatic typography analysis: serif classification and font similarities},
  journal = {Journal of Data Mining in Digital Humanities (JDMDH)},
  year    = {2023},
}
% Emotion recognition from facial micro-expressions, EEG and physiological signals: journal article, Frontiers in Psychology 2022.
% "EEG" is brace-protected so sentence-casing styles keep the acronym upper-case.
@article{wasim2022ecl,
  author  = {Nastaran Saffaryazdi and Syed Talal Wasim and Kuldeep Dileep and Alireza Farrokhi Nia and Suranga Nanayakkara and Elizabeth Broadbent and Mark Billinghurst},
  title   = {Using facial micro-expressions in combination with {EEG} and physiological signals for emotion recognition},
  journal = {Frontiers in Psychology},
  year    = {2022},
}
% Sim-to-real transfer for animal detection and localization: workshop paper, CV4Animals at CVPR 2021.
@inproceedings{wasim2021cv4animals,
  author    = {Syed Talal Wasim and Syed N. Hasany and Kainat Abbasi and Huda Feroz and Anisa A. Ahmed and Mudasir H. Shaikh and Muhammad Farhan},
  title     = {Sim-to-Real Transfer for Object Detection and Localization on Animals},
  booktitle = {CV4Animals CVPR Workshop},
  year      = {2021},
}
Powered by Jekyll and Minimal Light theme.