Publications

40 / 4,029 publications found.


  •  Li, D., Zhang, J., Egger, B., Chatterjee, M., Lohit, S., Marks, T.K., Cherian, A., "AssemblyBench: Physics-Aware Assembly of Complex Industrial Objects", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2026.
    BibTeX TR2026-076 PDF Video Data Software
    • @inproceedings{Li2026jun,
    • author = {Li, Danrui and Zhang, Jiahao and Egger, Bernhard and Chatterjee, Moitreya and Lohit, Suhas and Marks, Tim K. and Cherian, Anoop},
    • title = {{AssemblyBench: Physics-Aware Assembly of Complex Industrial Objects}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2026,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2026-076}
    • }
  •  Liu, X., Miraldo, P., Lohit, S., Jiang, H., Sawada, N., Tai, Y.-W., Tang, C.-K., Chatterjee, M., "Point4Cast: Streaming Dynamic Scene Reconstruction and Forecasting", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2026.
    BibTeX TR2026-077 PDF
    • @inproceedings{Liu2026jun,
    • author = {Liu, Xinhang and Miraldo, Pedro and Lohit, Suhas and Jiang, Huaizu and Sawada, Naoko and Tai, Yu-Wing and Tang, Chi-Keung and Chatterjee, Moitreya},
    • title = {{Point4Cast: Streaming Dynamic Scene Reconstruction and Forecasting}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2026,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2026-077}
    • }
  •  Shenoy, V., Lohit, S., Mansour, H., Chellappa, R., Marks, T.K., "Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models", IEEE Transactions on Image Processing, DOI: 10.1109/​TIP.2026.3671653, Vol. 35, pp. 2755-2770, March 2026.
    BibTeX TR2026-031 PDF
    • @article{Shenoy2026mar,
    • author = {Shenoy, Vineet and Lohit, Suhas and Mansour, Hassan and Chellappa, Rama and Marks, Tim K.},
    • title = {{Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models}},
    • journal = {IEEE Transactions on Image Processing},
    • year = 2026,
    • volume = 35,
    • pages = {2755--2770},
    • month = mar,
    • doi = {10.1109/TIP.2026.3671653},
    • issn = {1941-0042},
    • url = {https://www.merl.com/publications/TR2026-031}
    • }
  •  Moosa, I.M., Lohit, S., Wang, Y., Chatterjee, M., Yin, W., "Understanding Dynamic Compute Allocation in Recurrent Transformers", arXiv, February 2026.
    BibTeX arXiv
    • @article{Moosa2026feb,
    • author = {Moosa, Ibraheem Muhammad and Lohit, Suhas and Wang, Ye and Chatterjee, Moitreya and Yin, Wenpeng},
    • title = {{Understanding Dynamic Compute Allocation in Recurrent Transformers}},
    • journal = {arXiv},
    • year = 2026,
    • month = feb,
    • url = {https://arxiv.org/abs/2602.08864}
    • }
  •  Zhang, H., Peng, K.-C., Lohit, S., Yeh, R., "Auto-Vocabulary 3D Object Detection", arXiv, December 2025.
    BibTeX arXiv
    • @article{Zhang2025dec3,
    • author = {Zhang, Haomeng and Peng, Kuan-Chuan and Lohit, Suhas and Yeh, Raymond},
    • title = {{Auto-Vocabulary 3D Object Detection}},
    • journal = {arXiv},
    • year = 2025,
    • month = dec,
    • url = {https://arxiv.org/abs/2512.16077}
    • }
  •  Xiang, X., Peng, K.-C., Lohit, S., Jones, M.J., Zhang, J., "Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes", British Machine Vision Conference (BMVC), November 2025.
    BibTeX TR2025-162 PDF Video Data Presentation
    • @inproceedings{Xiang2025nov,
    • author = {Xiang, Xinhao and Peng, Kuan-Chuan and Lohit, Suhas and Jones, Michael J. and Zhang, Jiawei},
    • title = {{Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes}},
    • booktitle = {British Machine Vision Conference (BMVC)},
    • year = 2025,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2025-162}
    • }
  •  Shenoy, V., Wu, S., Comas, A., Lohit, S., Mansour, H., Marks, T.K., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", IEEE Access, DOI: 10.1109/​ACCESS.2025.3617284, Vol. 13, pp. 173923-173938, October 2025.
    BibTeX TR2025-145 PDF
    • @article{Shenoy2025oct,
    • author = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Lohit, Suhas and Mansour, Hassan and Marks, Tim K.},
    • title = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
    • journal = {IEEE Access},
    • year = 2025,
    • volume = 13,
    • pages = {173923--173938},
    • month = oct,
    • doi = {10.1109/ACCESS.2025.3617284},
    • url = {https://www.merl.com/publications/TR2025-145}
    • }
  •  Hu, Y., Lohit, S., Kamilov, U., Marks, T.K., "Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal", IEEE Transactions on Geoscience and Remote Sensing, DOI: 10.1109/​TGRS.2025.3604654, Vol. 63, September 2025.
    BibTeX TR2025-138 PDF
    • @article{Hu2025sep2,
    • author = {Hu, Yuyang and Lohit, Suhas and Kamilov, Ulugbek and Marks, Tim K.},
    • title = {{Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal}},
    • journal = {IEEE Transactions on Geoscience and Remote Sensing},
    • year = 2025,
    • volume = 63,
    • month = sep,
    • doi = {10.1109/TGRS.2025.3604654},
    • issn = {1558-0644},
    • url = {https://www.merl.com/publications/TR2025-138}
    • }
  •  Hegde, D., Lohit, S., Peng, K.-C., Jones, M.J., Patel, V.M., "Multimodal 3D Object Detection on Unseen Domains", IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop, June 2025, pp. 2499-2509.
    BibTeX TR2025-078 PDF
    • @inproceedings{Hegde2025jun,
    • author = {Hegde, Deepti and Lohit, Suhas and Peng, Kuan-Chuan and Jones, Michael J. and Patel, Vishal M.},
    • title = {{Multimodal 3D Object Detection on Unseen Domains}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop},
    • year = 2025,
    • pages = {2499--2509},
    • month = jun,
    • url = {https://www.merl.com/publications/TR2025-078}
    • }
  •  Sawada, N., Miraldo, P., Lohit, S., Marks, T.K., Chatterjee, M., "FreBIS: Frequency-Based Stratification for Neural Implicit Surface Representations", IEEE Conference on Computer Vision and Pattern Recognition Workshop (CVPR), DOI: 10.1109/​CVPRW67362.2025.00041, June 2025, pp. 369-379.
    BibTeX TR2025-074 PDF
    • @inproceedings{Sawada2025jun,
    • author = {Sawada, Naoko and Miraldo, Pedro and Lohit, Suhas and Marks, Tim K. and Chatterjee, Moitreya},
    • title = {{FreBIS: Frequency-Based Stratification for Neural Implicit Surface Representations}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition Workshop (CVPR)},
    • year = 2025,
    • pages = {369--379},
    • month = jun,
    • doi = {10.1109/CVPRW67362.2025.00041},
    • url = {https://www.merl.com/publications/TR2025-074}
    • }
  •  Basu, S., Lohit, S., Brand, M., "G-RepsNet: A Lightweight Construction of Equivariant Networks for Arbitrary Matrix Groups", Transactions on Machine Learning Research (TMLR), May 2025.
    BibTeX TR2025-056 PDF Software
    • @article{Basu2025may,
    • author = {Basu, Sourya and Lohit, Suhas and Brand, Matthew},
    • title = {{G-RepsNet: A Lightweight Construction of Equivariant Networks for Arbitrary Matrix Groups}},
    • journal = {Transactions on Machine Learning Research (TMLR)},
    • year = 2025,
    • month = may,
    • issn = {2835-8856},
    • url = {https://www.merl.com/publications/TR2025-056}
    • }
  •  Tang, H., Ellis, K., Lohit, S., Jones, M.J., Chatterjee, M., "Programmatic Video Prediction Using Large Language Models", International Conference on Learning Representations Workshops (ICLRW), April 2025.
    BibTeX TR2025-049 PDF
    • @inproceedings{Tang2025apr,
    • author = {Tang, Hao and Ellis, Kevin and Lohit, Suhas and Jones, Michael J. and Chatterjee, Moitreya},
    • title = {{Programmatic Video Prediction Using Large Language Models}},
    • booktitle = {International Conference on Learning Representations Workshops (ICLRW)},
    • year = 2025,
    • month = apr,
    • url = {https://www.merl.com/publications/TR2025-049}
    • }
  •  Shenoy, V., Wu, S., Comas, A., Marks, T.K., Lohit, S., Mansour, H., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", arXiv, March 2025.
    BibTeX arXiv
    • @article{Shenoy2025mar2,
    • author = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Marks, Tim K. and Lohit, Suhas and Mansour, Hassan},
    • title = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
    • journal = {arXiv},
    • year = 2025,
    • month = mar,
    • url = {https://arxiv.org/abs/2503.17351}
    • }
  •  Lohit, S., Marks, T.K., "Rotation-Equivariant Neural Networks for Cloud Removal from Satellite Images", Asilomar Conference on Signals, Systems, and Computers (ACSSC), DOI: 10.1109/​IEEECONF60004.2024.10942613, January 2025, pp. 1360-1365.
    BibTeX TR2025-009 PDF
    • @inproceedings{Lohit2025jan,
    • author = {Lohit, Suhas and Marks, Tim K.},
    • title = {{Rotation-Equivariant Neural Networks for Cloud Removal from Satellite Images}},
    • booktitle = {2024 58th Asilomar Conference on Signals, Systems, and Computers (ACSSC)},
    • year = 2025,
    • pages = {1360--1365},
    • month = jan,
    • publisher = {IEEE},
    • doi = {10.1109/IEEECONF60004.2024.10942613},
    • issn = {2576-2303},
    • isbn = {979-8-3503-5405-8},
    • url = {https://www.merl.com/publications/TR2025-009}
    • }
  •  Cherian, A., Peng, K.-C., Lohit, S., Matthiesen, J., Smith, K., Tenenbaum, J.B., "Evaluating Large Vision-and-Language Models on Children’s Mathematical Olympiads", Advances in Neural Information Processing Systems (NeurIPS), November 2024, pp. 15779-15800.
    BibTeX TR2024-160 PDF Video Presentation
    • @inproceedings{Cherian2024nov,
    • author = {Cherian, Anoop and Peng, Kuan-Chuan and Lohit, Suhas and Matthiesen, Joanna and Smith, Kevin and Tenenbaum, Joshua B.},
    • title = {{Evaluating Large Vision-and-Language Models on Children's Mathematical Olympiads}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
    • year = 2024,
    • pages = {15779--15800},
    • month = nov,
    • publisher = {NeurIPS Proceedings},
    • url = {https://www.merl.com/publications/TR2024-160}
    • }
  •  Hegde, D., Lohit, S., Peng, K.-C., Jones, M.J., Patel, V.M., "Equivariant Spatio-Temporal Self-Supervision for LiDAR Object Detection", European Conference on Computer Vision (ECCV), Leonardis, A. and Ricci, E. and Roth, S. and Russakovsky, O. and Sattler, T. and Varol, G., Eds., DOI: 10.1007/​978-3-031-73347-5_27, September 2024, pp. 475-491.
    BibTeX TR2024-130 PDF Video Presentation
    • @inproceedings{Hegde2024sep,
    • author = {Hegde, Deepti and Lohit, Suhas and Peng, Kuan-Chuan and Jones, Michael J. and Patel, Vishal M.},
    • title = {{Equivariant Spatio-Temporal Self-Supervision for LiDAR Object Detection}},
    • booktitle = {European Conference on Computer Vision (ECCV)},
    • year = 2024,
    • editor = {Leonardis, A. and Ricci, E. and Roth, S. and Russakovsky, O. and Sattler, T. and Varol, G.},
    • pages = {475--491},
    • month = sep,
    • publisher = {Springer},
    • doi = {10.1007/978-3-031-73347-5_27},
    • issn = {0302-9743},
    • isbn = {978-3-031-73346-8},
    • url = {https://www.merl.com/publications/TR2024-130}
    • }
  •  Ni, H., Egger, B., Lohit, S., Cherian, A., Wang, Y., Koike-Akino, T., Huang, S.X., Marks, T.K., "TI2V-Zero: Zero-Shot Image Conditioning for Text-to-Video Diffusion Models", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2024, pp. 9015-9025.
    BibTeX TR2024-059 PDF Video Software Presentation
    • @inproceedings{Ni2024jun,
    • author = {Ni, Haomiao and Egger, Bernhard and Lohit, Suhas and Cherian, Anoop and Wang, Ye and Koike-Akino, Toshiaki and Huang, Sharon X. and Marks, Tim K.},
    • title = {{TI2V-Zero: Zero-Shot Image Conditioning for Text-to-Video Diffusion Models}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2024,
    • pages = {9015--9025},
    • month = jun,
    • url = {https://www.merl.com/publications/TR2024-059}
    • }
  •  Liu, X., Tai, Y.-W., Tang, C.-K., Miraldo, P., Lohit, S., Chatterjee, M., "Gear-NeRF: Free-Viewpoint Rendering and Tracking with Motion-aware Spatio-Temporal Sampling", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), May 2024, pp. 19667-19679.
    BibTeX TR2024-042 PDF Videos Software
    • @inproceedings{Liu2024may,
    • author = {Liu, Xinhang and Tai, Yu-Wing and Tang, Chi-Keung and Miraldo, Pedro and Lohit, Suhas and Chatterjee, Moitreya},
    • title = {{Gear-NeRF: Free-Viewpoint Rendering and Tracking with Motion-aware Spatio-Temporal Sampling}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2024,
    • pages = {19667--19679},
    • month = may,
    • publisher = {IEEE},
    • url = {https://www.merl.com/publications/TR2024-042}
    • }
  •  Basu, S., Lohit, S., Brand, M., "G-RepsNet: A Fast and General Construction of Equivariant Networks for Arbitrary Matrix Groups", arXiv, February 2024.
    BibTeX arXiv
    • @article{Basu2024feb,
    • author = {Basu, Sourya and Lohit, Suhas and Brand, Matthew},
    • title = {{G-RepsNet: A Fast and General Construction of Equivariant Networks for Arbitrary Matrix Groups}},
    • journal = {arXiv},
    • year = 2024,
    • month = feb,
    • url = {https://arxiv.org/abs/2402.15413}
    • }
  •  Carmichael, Z., Lohit, S., Cherian, A., Jones, M.J., Scheirer, W., "Pixel-Grounded Prototypical Part Networks", IEEE Winter Conference on Applications of Computer Vision (WACV), DOI: 10.1109/​WACV57701.2024.00470, January 2024.
    BibTeX TR2024-002 PDF Video Software Presentation
    • @inproceedings{Carmichael2024jan,
    • author = {Carmichael, Zachariah and Lohit, Suhas and Cherian, Anoop and Jones, Michael J. and Scheirer, Walter},
    • title = {{Pixel-Grounded Prototypical Part Networks}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2024,
    • month = jan,
    • doi = {10.1109/WACV57701.2024.00470},
    • url = {https://www.merl.com/publications/TR2024-002}
    • }
  •  Nair, N.G., Cherian, A., Lohit, S., Wang, Y., Koike-Akino, T., Patel, V.M., Marks, T.K., "Steered Diffusion: A Generalized Framework for Plug-and-Play Conditional Image Synthesis", IEEE International Conference on Computer Vision (ICCV), October 2023, pp. 20850-20860.
    BibTeX TR2023-126 PDF Software Presentation
    • @inproceedings{Nair2023sep,
    • author = {Nair, Nithin Gopalakrishnan and Cherian, Anoop and Lohit, Suhas and Wang, Ye and Koike-Akino, Toshiaki and Patel, Vishal M. and Marks, Tim K.},
    • title = {{Steered Diffusion: A Generalized Framework for Plug-and-Play Conditional Image Synthesis}},
    • booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision},
    • year = 2023,
    • pages = {20850--20860},
    • month = oct,
    • publisher = {IEEE/CVF},
    • url = {https://www.merl.com/publications/TR2023-126}
    • }
  •  Sharma, M., Chatterjee, M., Peng, K.-C., Lohit, S., Jones, M.J., "Tensor Factorization for Leveraging Cross-Modal Knowledge in Data-Constrained Infrared Object Detection", IEEE International Conference on Computer Vision Workshops (ICCV), October 2023, pp. 924-932.
    BibTeX TR2023-125 PDF Presentation
    • @inproceedings{Sharma2023oct,
    • author = {Sharma, Manish and Chatterjee, Moitreya and Peng, Kuan-Chuan and Lohit, Suhas and Jones, Michael J.},
    • title = {{Tensor Factorization for Leveraging Cross-Modal Knowledge in Data-Constrained Infrared Object Detection}},
    • booktitle = {IEEE International Conference on Computer Vision Workshops (ICCV)},
    • year = 2023,
    • pages = {924--932},
    • month = oct,
    • url = {https://www.merl.com/publications/TR2023-125}
    • }
  •  Shenoy, V., Marks, T.K., Mansour, H., Lohit, S., "Unrolled IPPG: Video Heart Rate Estimation via Unrolling Proximal Gradient Descent", IEEE International Conference on Image Processing (ICIP), DOI: 10.1109/​ICIP49359.2023.10222169, September 2023, pp. 2715-2719.
    BibTeX TR2023-116 PDF Video
    • @inproceedings{Shenoy2023sep,
    • author = {Shenoy, Vineet and Marks, Tim K. and Mansour, Hassan and Lohit, Suhas},
    • title = {{Unrolled IPPG: Video Heart Rate Estimation via Unrolling Proximal Gradient Descent}},
    • booktitle = {IEEE International Conference on Image Processing (ICIP)},
    • year = 2023,
    • pages = {2715--2719},
    • month = sep,
    • publisher = {IEEE},
    • doi = {10.1109/ICIP49359.2023.10222169},
    • isbn = {978-1-7281-9835-4},
    • url = {https://www.merl.com/publications/TR2023-116}
    • }
  •  Jeon, E.S., Lohit, S., Anirudh, R., Turaga, P., "Robust Time Series Recovery and Classification Using Test-time Noise Simulator Networks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/​ICASSP49357.2023.10096888, May 2023.
    BibTeX TR2023-021 PDF Presentation
    • @inproceedings{Jeon2023may,
    • author = {Jeon, Eun Som and Lohit, Suhas and Anirudh, Rushil and Turaga, Pavan},
    • title = {{Robust Time Series Recovery and Classification Using Test-time Noise Simulator Networks}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2023,
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49357.2023.10096888},
    • url = {https://www.merl.com/publications/TR2023-021}
    • }
  •  Cherian, A., Peng, K.-C., Lohit, S., Smith, K., Tenenbaum, J.B., "Are Deep Neural Networks SMARTer than Second Graders?", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), March 2023, pp. 10834-10844.
    BibTeX TR2023-014 PDF Video Data Software Presentation
    • @inproceedings{Cherian2023mar,
    • author = {Cherian, Anoop and Peng, Kuan-Chuan and Lohit, Suhas and Smith, Kevin and Tenenbaum, Joshua B.},
    • title = {{Are Deep Neural Networks SMARTer than Second Graders?}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2023,
    • pages = {10834--10844},
    • month = mar,
    • publisher = {CVF},
    • url = {https://www.merl.com/publications/TR2023-014}
    • }