Publications

633 / 3,922 publications found.


  •  Nikovski, D.N., "Observation-Based Inverse Kinematics for Visual Servo Control", 22nd International Conference on Informatics in Control, Automation and Robotics (ICINCO), October 2025.
    BibTeX TR2025-153 PDF
    • @inproceedings{Nikovski2025oct,
    • author    = {Nikovski, Daniel N.},
    • title     = {{Observation-Based Inverse Kinematics for Visual Servo Control}},
    • booktitle = {22nd International Conference on Informatics in Control, Automation and Robotics (ICINCO)},
    • month     = oct,
    • year      = {2025},
    • url       = {https://www.merl.com/publications/TR2025-153}
    • }
  •  Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Radar-Conditioned 3D Bounding Box Diffusion for Indoor Human Perception", IEEE International Conference on Computer Vision (ICCV) Workshop, October 2025.
    BibTeX TR2025-154 PDF
    • @inproceedings{Yataka2025oct,
    • author    = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
    • title     = {{Radar-Conditioned 3D Bounding Box Diffusion for Indoor Human Perception}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshop},
    • month     = oct,
    • year      = {2025},
    • url       = {https://www.merl.com/publications/TR2025-154}
    • }
  •  Piedade, V., Chitturi, S., Gaspar, J., Govindu, V., Miraldo, P., "SAC-GNC: SAmple Consensus for adaptive Graduated Non-Convexity", IEEE International Conference on Computer Vision (ICCV), October 2025.
    BibTeX TR2025-146 PDF Presentation
    • @inproceedings{Piedade2025oct,
    • author = {Piedade, Valter and Chitturi, Sidhartha and Gaspar, Jose and Govindu, Venu and Miraldo, Pedro},
    • title = {{SAC-GNC: SAmple Consensus for adaptive Graduated Non-Convexity}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-146}
    • }
  •  Yang, C.-A., Peng, K.-C., Yeh, R., "Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts", IEEE International Conference on Computer Vision (ICCV), October 2025.
    BibTeX TR2025-124 PDF Video Data Presentation
    • @inproceedings{Yang2025oct,
    • author = {Yang, Chiao-An and Peng, Kuan-Chuan and Yeh, Raymond},
    • title = {{Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-124}
    • }
  •  Peng, K.-C., "Joint Training of Image Generator and Detector for Road Defect Detection", IEEE International Conference on Computer Vision (ICCV) Workshops, October 2025.
    BibTeX TR2025-149 PDF Video Presentation
    • @inproceedings{Peng2025oct,
    • author = {Peng, Kuan-Chuan},
    • title = {{Joint Training of Image Generator and Detector for Road Defect Detection}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshops},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-149}
    • }
  •  Karumanchi, S., Rokaha, B., Schperberg, A., Vinod, A.P., "Energy-constrained multi-robot exploration for autonomous map building", IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), October 2025.
    BibTeX TR2025-131 PDF
    • @inproceedings{Karumanchi2025oct,
    • author    = {Karumanchi, Sambhu and Rokaha, Bhagawan and Schperberg, Alexander and Vinod, Abraham P.},
    • title     = {{Energy-constrained multi-robot exploration for autonomous map building}},
    • booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
    • month     = oct,
    • year      = {2025},
    • url       = {https://www.merl.com/publications/TR2025-131}
    • }
  •  Shenoy, V., Wu, S., Comas, A., Lohit, S., Mansour, H., Marks, T.K., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", IEEE Access, October 2025.
    BibTeX TR2025-145 PDF
    • @article{Shenoy2025oct,
    • author  = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Lohit, Suhas and Mansour, Hassan and Marks, Tim K.},
    • title   = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
    • journal = {IEEE Access},
    • month   = oct,
    • year    = {2025},
    • url     = {https://www.merl.com/publications/TR2025-145}
    • }
  •  Zhang, J., Cherian, A., Rodriguez, C., Deng, W., Gould, S., "Manual-PA: Learning 3D Part Assembly from Instruction Diagrams", IEEE International Conference on Computer Vision (ICCV), September 2025.
    BibTeX TR2025-139 PDF
    • @inproceedings{Zhang2025sep,
    • author    = {Zhang, Jiahao and Cherian, Anoop and Rodriguez, Cristian and Deng, Weijian and Gould, Stephen},
    • title     = {{Manual-PA: Learning 3D Part Assembly from Instruction Diagrams}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV)},
    • month     = sep,
    • year      = {2025},
    • url       = {https://www.merl.com/publications/TR2025-139}
    • }
  •  Hu, Y., Lohit, S., Kamilov, U., Marks, T.K., "Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal", IEEE Transactions on Geoscience and Remote Sensing, DOI: 10.1109/TGRS.2025.3604654, Vol. 63, September 2025.
    BibTeX TR2025-138 PDF
    • @article{Hu2025sep2,
    • author  = {Hu, Yuyang and Lohit, Suhas and Kamilov, Ulugbek and Marks, Tim K.},
    • title   = {{Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal}},
    • journal = {IEEE Transactions on Geoscience and Remote Sensing},
    • volume  = {63},
    • month   = sep,
    • year    = {2025},
    • doi     = {10.1109/TGRS.2025.3604654},
    • issn    = {1558-0644},
    • url     = {https://www.merl.com/publications/TR2025-138}
    • }
  •  Wang, J.-W., Nikovski, D.N., "State Representation Learning for Visual Servo Control", European Control Conference (ECC), June 2025.
    BibTeX TR2025-094 PDF
    • @inproceedings{Wang2025jun,
    • author    = {Wang, Jen-Wei and Nikovski, Daniel N.},
    • title     = {{State Representation Learning for Visual Servo Control}},
    • booktitle = {European Control Conference (ECC)},
    • month     = jun,
    • year      = {2025},
    • url       = {https://www.merl.com/publications/TR2025-094}
    • }
  •  Jung, Y.G., Park, J., Yoon, J., Peng, K.-C., Kim, W., Teoh, A.B.J., Camps, O., "TailedCore: Few-Shot Sampling for Unsupervised Long-Tail Noisy Anomaly Detection", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), Isola, P. and Kjellström, H. and Lepetit, V. and Li, F. and Su, H. and Tang, S., Eds., DOI: 10.1109/CVPR52734.2025.02378, June 2025, pp. 25539-25548.
    BibTeX TR2025-077 PDF Video Presentation
    • @inproceedings{Jung2025jun,
    • author = {Jung, Yoon G. and Park, Jaewoo and Yoon, Jaeho and Peng, Kuan-Chuan and Kim, Wonchul and Teoh, Andrew B. J. and Camps, Octavia},
    • title = {{TailedCore: Few-Shot Sampling for Unsupervised Long-Tail Noisy Anomaly Detection}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2025,
    • editor = {Isola, P. and Kjellström, H. and Lepetit, V. and Li, F. and Su, H. and Tang, S.},
    • pages = {25539--25548},
    • month = jun,
    • publisher = {IEEE},
    • doi = {10.1109/CVPR52734.2025.02378},
    • issn = {2575-7075},
    • isbn = {979-8-3315-4364-8},
    • url = {https://www.merl.com/publications/TR2025-077}
    • }
  •  Lai, Y.-H., Ebbers, J., Wang, Y.-C.F., Germain, F.G., Jones, M.J., Chatterjee, M., "UWAV: Uncertainty-weighted Weakly-supervised Audio-Visual Video Parsing", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR52734.2025.01266, June 2025, pp. 13561-13570.
    BibTeX TR2025-072 PDF
    • @inproceedings{Lai2025jun,
    • author = {Lai, Yung-Hsuan and Ebbers, Janek and Wang, Yu-Chiang Frank and Germain, François G. and Jones, Michael J. and Chatterjee, Moitreya},
    • title = {{UWAV: Uncertainty-weighted Weakly-supervised Audio-Visual Video Parsing}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2025,
    • pages = {13561--13570},
    • month = jun,
    • publisher = {IEEE},
    • doi = {10.1109/CVPR52734.2025.01266},
    • url = {https://www.merl.com/publications/TR2025-072}
    • }
  •  Hegde, D., Lohit, S., Peng, K.-C., Jones, M.J., Patel, V.M., "Multimodal 3D Object Detection on Unseen Domains", IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop, June 2025, pp. 2499-2509.
    BibTeX TR2025-078 PDF
    • @inproceedings{Hegde2025jun,
    • author    = {Hegde, Deepti and Lohit, Suhas and Peng, Kuan-Chuan and Jones, Michael J. and Patel, Vishal M.},
    • title     = {{Multimodal 3D Object Detection on Unseen Domains}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop},
    • pages     = {2499--2509},
    • month     = jun,
    • year      = {2025},
    • url       = {https://www.merl.com/publications/TR2025-078}
    • }
  •  Li, K., Zhang, T., Peng, K.-C., Wang, G., "PF3Det: A Prompted Foundation Feature Assisted Visual LiDAR 3D Detector", IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop, June 2025, pp. 3787-3796.
    BibTeX TR2025-076 PDF Presentation
    • @inproceedings{Li2025jun,
    • author = {Li, Kaidong and Zhang, Tianxiao and Peng, Kuan-Chuan and Wang, Guanghui},
    • title = {{PF3Det: A Prompted Foundation Feature Assisted Visual LiDAR 3D Detector}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop},
    • year = 2025,
    • pages = {3787--3796},
    • month = jun,
    • url = {https://www.merl.com/publications/TR2025-076}
    • }
  •  Sawada, N., Miraldo, P., Lohit, S., Marks, T.K., Chatterjee, M., "FreBIS: Frequency-Based Stratification for Neural Implicit Surface Representations", IEEE Conference on Computer Vision and Pattern Recognition Workshop (CVPR), DOI: 10.1109/CVPRW67362.2025.00041, June 2025, pp. 369-379.
    BibTeX TR2025-074 PDF
    • @inproceedings{Sawada2025jun,
    • author    = {Sawada, Naoko and Miraldo, Pedro and Lohit, Suhas and Marks, Tim K. and Chatterjee, Moitreya},
    • title     = {{FreBIS: Frequency-Based Stratification for Neural Implicit Surface Representations}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition Workshop (CVPR)},
    • pages     = {369--379},
    • month     = jun,
    • year      = {2025},
    • doi       = {10.1109/CVPRW67362.2025.00041},
    • url       = {https://www.merl.com/publications/TR2025-074}
    • }
  •  Ni, Y., Wen, S., Koniusz, P., Cherian, A., "Noise Consistency Regularization for Improved Subject-Driven Image Synthesis", IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPR), June 2025, pp. 3116-3126.
    BibTeX TR2025-073 PDF
    • @inproceedings{Ni2025jun,
    • author    = {Ni, Yao and Wen, Song and Koniusz, Piotr and Cherian, Anoop},
    • title     = {{Noise Consistency Regularization for Improved Subject-Driven Image Synthesis}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPR)},
    • pages     = {3116--3126},
    • publisher = {CVF},
    • month     = jun,
    • year      = {2025},
    • url       = {https://www.merl.com/publications/TR2025-073}
    • }
  •  Lu, K., Ma, C., Hori, C., Romeres, D., "KitchenVLA: Iterative Vision-Language Corrections for Robotic Execution of Human Tasks", IEEE International Conference on Robotics and Automation Workshop on Safely Leveraging Vision-Language Foundation Models in Robotics (SafeLVMs@ICRA), May 2025.
    BibTeX TR2025-068 PDF
    • @inproceedings{Lu2025may,
    • author    = {Lu, Kai and Ma, Chenyang and Hori, Chiori and Romeres, Diego},
    • title     = {{KitchenVLA: Iterative Vision-Language Corrections for Robotic Execution of Human Tasks}},
    • booktitle = {IEEE International Conference on Robotics and Automation Workshop on Safely Leveraging Vision-Language Foundation Models in Robotics (SafeLVMs@ICRA)},
    • month     = may,
    • year      = {2025},
    • url       = {https://www.merl.com/publications/TR2025-068}
    • }
  •  Singh, A., Jones, M.J., Peng, K.-C., Chatterjee, M., Cherian, A., Learned-Miller, E., "Improving Open-World Object Localization by Discovering Background", CVPR Workshop on Domain Generalization: Evolution, Breakthroughs and Future Horizon, May 2025, pp. 6449-6458.
    BibTeX TR2025-058 PDF
    • @inproceedings{Singh2025may,
    • author    = {Singh, Ashish and Jones, Michael J. and Peng, Kuan-Chuan and Chatterjee, Moitreya and Cherian, Anoop and Learned-Miller, Erik},
    • title     = {{Improving Open-World Object Localization by Discovering Background}},
    • booktitle = {CVPR Workshop on Domain Generalization: Evolution, Breakthroughs and Future Horizon},
    • pages     = {6449--6458},
    • month     = may,
    • year      = {2025},
    • url       = {https://www.merl.com/publications/TR2025-058}
    • }
  •  Basu, S., Lohit, S., Brand, M., "G-RepsNet: A Lightweight Construction of Equivariant Networks for Arbitrary Matrix Groups", Transactions on Machine Learning Research (TMLR), May 2025.
    BibTeX TR2025-056 PDF Software
    • @article{Basu2025may,
    • author = {Basu, Sourya and Lohit, Suhas and Brand, Matthew},
    • title = {{G-RepsNet: A Lightweight Construction of Equivariant Networks for Arbitrary Matrix Groups}},
    • journal = {Transactions on Machine Learning Research (TMLR)},
    • year = 2025,
    • month = may,
    • issn = {2835-8856},
    • url = {https://www.merl.com/publications/TR2025-056}
    • }
  •  Tang, H., Ellis, K., Lohit, S., Jones, M.J., Chatterjee, M., "Programmatic Video Prediction Using Large Language Models", International Conference on Learning Representations Workshops (ICLRW), April 2025.
    BibTeX TR2025-049 PDF
    • @inproceedings{Tang2025apr,
    • author    = {Tang, Hao and Ellis, Kevin and Lohit, Suhas and Jones, Michael J. and Chatterjee, Moitreya},
    • title     = {{Programmatic Video Prediction Using Large Language Models}},
    • booktitle = {International Conference on Learning Representations Workshops (ICLRW)},
    • month     = apr,
    • year      = {2025},
    • url       = {https://www.merl.com/publications/TR2025-049}
    • }
  •  Hori, C., Kambara, M., Sugiura, K., Ota, K., Khurana, S., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Interactive Robot Action Replanning using Multimodal LLM Trained from Human Demonstration Videos", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10887717, April 2025.
    BibTeX TR2025-034 PDF
    • @inproceedings{Hori2025mar,
    • author = {Hori, Chiori and Kambara, Motonari and Sugiura, Komei and Ota, Kei and Khurana, Sameer and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
    • title = {{Interactive Robot Action Replanning using Multimodal {LLM} Trained from Human Demonstration Videos}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = apr,
    • doi = {10.1109/ICASSP49660.2025.10887717},
    • url = {https://www.merl.com/publications/TR2025-034}
    • }
  •  Ranade, S., Pais, G., Whitaker, R., Nascimento, J., Miraldo, P., Ramalingam, S., "SurfR: Surface Reconstruction with Multi-scale Attention", International Conference on 3D Vision (3DV), March 2025.
    BibTeX TR2025-039 PDF Presentation
    • @inproceedings{Ranade2025mar,
    • author = {Ranade, Siddhant and Pais, Goncalo and Whitaker, Ross and Nascimento, Jacinto and Miraldo, Pedro and Ramalingam, Srikumar},
    • title = {{SurfR: Surface Reconstruction with Multi-scale Attention}},
    • booktitle = {International Conference on 3D Vision (3DV)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-039}
    • }
  •  Wang, Y., Peng, K.-C., Fu, R., "Towards Zero-shot 3D Anomaly Localization", IEEE Winter Conference on Applications of Computer Vision (WACV), Biswas, S. and Averbuch-Elor, H. and Štruc, V. and Yang, Y., Eds., DOI: 10.1109/WACV61041.2025.00148, February 2025, pp. 1447-1456.
    BibTeX TR2025-020 PDF Video Presentation
    • @inproceedings{Wang2025feb2,
    • author    = {Wang, Yizhou and Peng, Kuan-Chuan and Fu, Raymond},
    • title     = {{Towards Zero-shot 3D Anomaly Localization}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • editor    = {Biswas, S. and Averbuch-Elor, H. and Štruc, V. and Yang, Y.},
    • pages     = {1447--1456},
    • publisher = {IEEE},
    • month     = feb,
    • year      = {2025},
    • doi       = {10.1109/WACV61041.2025.00148},
    • issn      = {2642-9381},
    • isbn      = {979-8-3315-1083-1},
    • url       = {https://www.merl.com/publications/TR2025-020}
    • }
  •  Mumcu, F., Jones, M.J., Yilmaz, Y., Cherian, A., "ComplexVAD: Detecting Interaction Anomalies in Video", IEEE Winter Conference on Applications of Computer Vision (WACV) Workshop, DOI: 10.1109/WACVW65960.2025.00122, February 2025.
    BibTeX TR2025-016 PDF Data
    • @inproceedings{Mumcu2025feb,
    • author    = {Mumcu, Furkan and Jones, Michael J. and Yilmaz, Yasin and Cherian, Anoop},
    • title     = {{ComplexVAD: Detecting Interaction Anomalies in Video}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV) Workshop},
    • month     = feb,
    • year      = {2025},
    • doi       = {10.1109/WACVW65960.2025.00122},
    • url       = {https://www.merl.com/publications/TR2025-016}
    • }
  •  Lohit, S., Marks, T.K., "Rotation-Equivariant Neural Networks for Cloud Removal from Satellite Images", Asilomar Conference on Signals, Systems, and Computers (ACSSC), DOI: 10.1109/IEEECONF60004.2024.10942613, January 2025, pp. 1360-1365.
    BibTeX TR2025-009 PDF
    • @inproceedings{Lohit2025jan,
    • author    = {Lohit, Suhas and Marks, Tim K.},
    • title     = {{Rotation-Equivariant Neural Networks for Cloud Removal from Satellite Images}},
    • booktitle = {2024 58th Asilomar Conference on Signals, Systems, and Computers (ACSSC)},
    • pages     = {1360--1365},
    • publisher = {IEEE},
    • month     = jan,
    • year      = {2025},
    • doi       = {10.1109/IEEECONF60004.2024.10942613},
    • issn      = {2576-2303},
    • isbn      = {979-8-3503-5405-8},
    • url       = {https://www.merl.com/publications/TR2025-009}
    • }