Publications

653 / 4,036 publications found.


  •  Cherian, A., Lohit, S., Peng, K.-C., "WISE: Weighted Iterative Society-of-Experts for Multimodal Multi-Agent Debate with Probabilistic Consensus", ICML SCALE AI Workshop, June 2026.
    BibTeX TR2026-083 PDF
    • @inproceedings{Cherian2026jun,
    • author = {Cherian, Anoop and Lohit, Suhas and Peng, Kuan-Chuan},
    • title = {{WISE: Weighted Iterative Society-of-Experts for Multimodal Multi-Agent Debate with Probabilistic Consensus}},
    • booktitle = {ICML SCALE AI Workshop},
    • year = 2026,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2026-083}
    • }
  •  Zhou, Q., Gan, C., Cherian, A., "LLawCo: Learning Laws of Cooperation for Modeling Embodied Multi-Agent Behavior", International Conference on Machine Learning (ICML), June 2026.
    BibTeX TR2026-081 PDF
    • @inproceedings{Zhou2026jun,
    • author = {Zhou, Qinhong and Gan, Chuang and Cherian, Anoop},
    • title = {{LLawCo: Learning Laws of Cooperation for Modeling Embodied Multi-Agent Behavior}},
    • booktitle = {International Conference on Machine Learning (ICML)},
    • year = 2026,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2026-081}
    • }
  •  Hsieh, J.-W., Wu, Y.-H., Hsieh, Y.-K., Li, X., Peng, K.-C., Chang, M.-C., "SoREL: Soft-Label Refurbishment with Ensemble Learning for Noisy Long-Tailed Classification", CVPR Findings, June 2026.
    BibTeX TR2026-075 PDF
    • @inproceedings{Hsieh2026jun2,
    • author = {Hsieh, Jun-Wei and Wu, Ying-Hsuan and Hsieh, Yi-Kuan and Li, Xin and Peng, Kuan-Chuan and Chang, Ming-Ching},
    • title = {{SoREL: Soft-Label Refurbishment with Ensemble Learning for Noisy Long-Tailed Classification}},
    • booktitle = {CVPR Findings},
    • year = 2026,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2026-075}
    • }
  •  Hsieh, J.-W., Wu, Y.-H., Hsieh, Y.-K., Li, X., Peng, K.-C., Chang, M.-C., "SoREL: Soft-Label Refurbishment with Ensemble Learning for Noisy Long-Tailed Classification Supplementary Material", CVPR Findings, June 2026.
    BibTeX TR2026-074 PDF
    • @inproceedings{Hsieh2026jun,
    • author = {Hsieh, Jun-Wei and Wu, Ying-Hsuan and Hsieh, Yi-Kuan and Li, Xin and Peng, Kuan-Chuan and Chang, Ming-Ching},
    • title = {{SoREL: Soft-Label Refurbishment with Ensemble Learning for Noisy Long-Tailed Classification Supplementary Material}},
    • booktitle = {CVPR Findings},
    • year = 2026,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2026-074}
    • }
  •  Li, D., Zhang, J., Egger, B., Chatterjee, M., Lohit, S., Marks, T.K., Cherian, A., "AssemblyBench: Physics-Aware Assembly of Complex Industrial Objects", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2026.
    BibTeX TR2026-076 PDF Video Data Software
    • @inproceedings{Li2026jun,
    • author = {Li, Danrui and Zhang, Jiahao and Egger, Bernhard and Chatterjee, Moitreya and Lohit, Suhas and Marks, Tim K. and Cherian, Anoop},
    • title = {{AssemblyBench: Physics-Aware Assembly of Complex Industrial Objects}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2026,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2026-076}
    • }
  •  Liu, X., Miraldo, P., Lohit, S., Jiang, H., Sawada, N., Tai, Y.-W., Tang, C.-K., Chatterjee, M., "Point4Cast: Streaming Dynamic Scene Reconstruction and Forecasting", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2026.
    BibTeX TR2026-077 PDF
    • @inproceedings{Liu2026jun,
    • author = {Liu, Xinhang and Miraldo, Pedro and Lohit, Suhas and Jiang, Huaizu and Sawada, Naoko and Tai, Yu-Wing and Tang, Chi-Keung and Chatterjee, Moitreya},
    • title = {{Point4Cast: Streaming Dynamic Scene Reconstruction and Forecasting}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2026,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2026-077}
    • }
  •  Jain, S., Choi, H.J., "SplatCtrl: Perception–Action Coupling via Gaussian Scene Representations and Reactive Robot Control", 2026 IEEE International Conference on Robotics & Automation (ICRA), June 2026.
    BibTeX TR2026-069 PDF
    • @inproceedings{Jain2026jun,
    • author = {Jain, Siddarth and Choi, Ho Jin},
    • title = {{SplatCtrl: Perception–Action Coupling via Gaussian Scene Representations and Reactive Robot Control}},
    • booktitle = {2026 IEEE International Conference on Robotics \& Automation (ICRA)},
    • year = 2026,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2026-069}
    • }
  •  Velentzas, I.G., Tomita, K., "LIDIA: Localizing In the Dark with Illumination-Awareness toward Perception-Aware Planning", IEEE International Conference on Robotics and Automation (ICRA), June 2026.
    BibTeX TR2026-071 PDF
    • @inproceedings{Velentzas2026jun,
    • author = {Velentzas, I.G. and Tomita, K.},
    • title = {{LIDIA: Localizing In the Dark with Illumination-Awareness toward Perception-Aware Planning}},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2026,
    • month = jun,
    • url = {https://www.merl.com/publications/TR2026-071}
    • }
  •  Ding, T., Xie, Y., Liang, Y., Chatterjee, M., Miraldo, P., Jiang, H., "LASER: Layer-wise Scale Alignment for Training-Free Streaming 4D Reconstruction", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), May 2026.
    BibTeX TR2026-055 PDF
    • @inproceedings{Ding2026may,
    • author = {Ding, Tianye and Xie, Yiming and Liang, Yiqing and Chatterjee, Moitreya and Miraldo, Pedro and Jiang, Huaizu},
    • title = {{LASER: Layer-wise Scale Alignment for Training-Free Streaming 4D Reconstruction}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2026,
    • month = may,
    • url = {https://www.merl.com/publications/TR2026-055}
    • }
  •  Manam, L., Govindu, V., "Parallel Rigidity Matters for Bundle Adjustment", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), May 2026, pp. 29035-29046.
    BibTeX TR2026-053 PDF Video Presentation
    • @inproceedings{Lalit2026may,
    • author = {Manam, Lalit and Govindu, Venu},
    • title = {{Parallel Rigidity Matters for Bundle Adjustment}},
    • booktitle = {IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2026,
    • pages = {29035--29046},
    • month = may,
    • url = {https://www.merl.com/publications/TR2026-053}
    • }
  •  Piedade, V., Manam, L., Yamazaki, M., Miraldo, P., "Revisiting Monocular SLAM with Spatio-Temporal Scene Modeling", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), May 2026.
    BibTeX TR2026-056 PDF Video Software Presentation
    • @inproceedings{Piedade2026may,
    • author = {Piedade, Valter and Manam, Lalit and Yamazaki, Masashi and Miraldo, Pedro},
    • title = {{Revisiting Monocular SLAM with Spatio-Temporal Scene Modeling}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2026,
    • month = may,
    • url = {https://www.merl.com/publications/TR2026-056}
    • }
  •  Cherian, A., Corcodel, R., Jain, S., Romeres, D., "LLMPhy: Parameter-Identifiable Physical Reasoning Combining Large Language Models and Physics Engines", International Conference on Artificial Intelligence and Statistics (AISTATS), May 2026.
    BibTeX TR2026-052 PDF Data Software
    • @inproceedings{Cherian2026may,
    • author = {Cherian, Anoop and Corcodel, Radu and Jain, Siddarth and Romeres, Diego},
    • title = {{LLMPhy: Parameter-Identifiable Physical Reasoning Combining Large Language Models and Physics Engines}},
    • booktitle = {International Conference on Artificial Intelligence and Statistics (AISTATS)},
    • year = 2026,
    • month = may,
    • url = {https://www.merl.com/publications/TR2026-052}
    • }
  •  Shenoy, V., Lohit, S., Mansour, H., Chellappa, R., Marks, T.K., "Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models", IEEE Transactions on Image Processing, DOI: 10.1109/TIP.2026.3671653, Vol. 35, pp. 2755-2770, March 2026.
    BibTeX TR2026-031 PDF
    • @article{Shenoy2026mar,
    • author = {Shenoy, Vineet and Lohit, Suhas and Mansour, Hassan and Chellappa, Rama and Marks, Tim K.},
    • title = {{Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models}},
    • journal = {IEEE Transactions on Image Processing},
    • year = 2026,
    • volume = 35,
    • pages = {2755--2770},
    • month = mar,
    • doi = {10.1109/TIP.2026.3671653},
    • issn = {1941-0042},
    • url = {https://www.merl.com/publications/TR2026-031}
    • }
  •  Kogashi, K., Cherian, A., Kuo, M.-Y.J., "MMHOI: Modeling Complex 3D Multi-Human Multi-Object Interactions", IEEE Winter Conference on Applications of Computer Vision (WACV), March 2026, pp. 1512-1521.
    BibTeX TR2026-029 PDF Video Data
    • @inproceedings{Kogashi2026mar,
    • author = {Kogashi, Kaen and Cherian, Anoop and Kuo, Meng-Yu Jennifer},
    • title = {{MMHOI: Modeling Complex 3D Multi-Human Multi-Object Interactions}},
    • booktitle = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
    • year = 2026,
    • pages = {1512--1521},
    • month = mar,
    • url = {https://www.merl.com/publications/TR2026-029}
    • }
  •  Mumcu, F., Jones, M.J., Yilmaz, Y., Cherian, A., "Leveraging Multimodal LLM Descriptions of Activity for Explainable Semi-Supervised Video Anomaly Detection", Transactions on Machine Learning Research, February 2026.
    BibTeX TR2026-027 PDF
    • @article{Mumcu2026feb2,
    • author = {Mumcu, Furkan and Jones, Michael J. and Yilmaz, Yasin and Cherian, Anoop},
    • title = {{Leveraging Multimodal LLM Descriptions of Activity for Explainable Semi-Supervised Video Anomaly Detection}},
    • journal = {Transactions on Machine Learning Research},
    • year = 2026,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2026-027}
    • }
  •  Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Indoor Multi-View Radar Object Detection via 3D Bounding Box Diffusion", AAAI Conference on Artificial Intelligence, DOI: 10.1609/aaai.v40i22.38939, January 2026, vol. 40, pp. 18710-18718.
    BibTeX TR2026-019 PDF Software
    • @inproceedings{Yataka2026jan,
    • author = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
    • title = {{Indoor Multi-View Radar Object Detection via 3D Bounding Box Diffusion}},
    • booktitle = {AAAI Conference on Artificial Intelligence},
    • year = 2026,
    • volume = 40,
    • number = 22,
    • pages = {18710--18718},
    • month = jan,
    • doi = {10.1609/aaai.v40i22.38939},
    • url = {https://www.merl.com/publications/TR2026-019}
    • }
  •  Kuwabara, A., Kato, S., Koike-Akino, T., Fujihashi, T., "Range Image-Based Implicit Neural Compression for LiDAR Point Clouds", IEEE Access, DOI: 10.1109/ACCESS.2026.3654068, Vol. 14, pp. 10262-10275, January 2026.
    BibTeX TR2026-023 PDF
    • @article{Kuwabara2026feb,
    • author = {Kuwabara, Akihiro and Kato, Sorachi and Koike-Akino, Toshiaki and Fujihashi, Takuya},
    • title = {{Range Image-Based Implicit Neural Compression for LiDAR Point Clouds}},
    • journal = {IEEE Access},
    • year = 2026,
    • volume = 14,
    • pages = {10262--10275},
    • month = feb,
    • doi = {10.1109/ACCESS.2026.3654068},
    • issn = {2169-3536},
    • url = {https://www.merl.com/publications/TR2026-023}
    • }
  •  Hori, C., Masuyama, Y., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM", IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), DOI: 10.1109/ASRU65441.2025.11434641, December 2025.
    BibTeX TR2025-167 PDF
    • @inproceedings{Hori2025dec,
    • author = {Hori, Chiori and Masuyama, Yoshiki and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
    • title = {{Robot Confirmation Generation and Action Planning Using Long-context Q-Former Integrated with Multimodal LLM}},
    • booktitle = {IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
    • year = 2025,
    • month = dec,
    • doi = {10.1109/ASRU65441.2025.11434641},
    • issn = {2997-6995},
    • isbn = {979-8-3315-4426-3},
    • url = {https://www.merl.com/publications/TR2025-167}
    • }
  •  Xiang, X., Peng, K.-C., Lohit, S., Jones, M.J., Zhang, J., "Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes", British Machine Vision Conference (BMVC), November 2025.
    BibTeX TR2025-162 PDF Video Data Presentation
    • @inproceedings{Xiang2025nov,
    • author = {Xiang, Xinhao and Peng, Kuan-Chuan and Lohit, Suhas and Jones, Michael J. and Zhang, Jiawei},
    • title = {{Towards Open-Vocabulary Multimodal 3D Object Detection with Attributes}},
    • booktitle = {British Machine Vision Conference (BMVC)},
    • year = 2025,
    • month = nov,
    • url = {https://www.merl.com/publications/TR2025-162}
    • }
  •  Gambill, P., Jha, D.K., Krishnamoorthy, B., Raghunathan, A., Yerazunis, W.S., "DamageEst: Accurate Estimation of Damage for Repair using Additive Manufacturing", Solid Freeform Fabrication Symposium (SFF), November 2025, pp. 1506-1526.
    BibTeX TR2025-158 PDF Presentation
    • @inproceedings{Gambill2025nov,
    • author = {Gambill, Patrick and Jha, Devesh K. and Krishnamoorthy, Bala and Raghunathan, Arvind and Yerazunis, William S.},
    • title = {{DamageEst: Accurate Estimation of Damage for Repair using Additive Manufacturing}},
    • booktitle = {36th Annual International Solid Freeform Fabrication Symposium – An Additive Manufacturing Conference},
    • year = 2025,
    • pages = {1506--1526},
    • month = nov,
    • url = {https://www.merl.com/publications/TR2025-158}
    • }
  •  Nikovski, D.N., "Observation-Based Inverse Kinematics for Visual Servo Control", 22nd International Conference on Informatics in Control, Automation and Robotics (ICINCO), DOI: 10.5220/0013701100003982, October 2025, pp. 200-207.
    BibTeX TR2025-153 PDF
    • @inproceedings{Nikovski2025oct,
    • author = {Nikovski, Daniel N.},
    • title = {{Observation-Based Inverse Kinematics for Visual Servo Control}},
    • booktitle = {22nd International Conference on Informatics in Control, Automation and Robotics (ICINCO)},
    • year = 2025,
    • pages = {200--207},
    • month = oct,
    • publisher = {SciTePress},
    • doi = {10.5220/0013701100003982},
    • isbn = {978-989-758-770-2},
    • url = {https://www.merl.com/publications/TR2025-153}
    • }
  •  Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Radar-Conditioned 3D Bounding Box Diffusion for Indoor Human Perception", IEEE International Conference on Computer Vision (ICCV) Workshop, October 2025.
    BibTeX TR2025-154 PDF Software
    • @inproceedings{Yataka2025oct,
    • author = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
    • title = {{Radar-Conditioned 3D Bounding Box Diffusion for Indoor Human Perception}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshop},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-154}
    • }
  •  Piedade, V., Chitturi, S., Gaspar, J., Govindu, V., Miraldo, P., "SAC-GNC: SAmple Consensus for adaptive Graduated Non-Convexity", IEEE International Conference on Computer Vision (ICCV), DOI: 10.1109/ICCV51701.2025.00547, October 2025, pp. 5780-5790.
    BibTeX TR2025-146 PDF Video Software Presentation
    • @inproceedings{Piedade2025oct,
    • author = {Piedade, Valter and Chitturi, Sidhartha and Gaspar, Jose and Govindu, Venu and Miraldo, Pedro},
    • title = {{SAC-GNC: SAmple Consensus for adaptive Graduated Non-Convexity}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV)},
    • year = 2025,
    • pages = {5780--5790},
    • month = oct,
    • doi = {10.1109/ICCV51701.2025.00547},
    • url = {https://www.merl.com/publications/TR2025-146}
    • }
  •  Yang, C.-A., Peng, K.-C., Yeh, R., "Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts", IEEE International Conference on Computer Vision (ICCV), October 2025.
    BibTeX TR2025-124 PDF Video Data Presentation
    • @inproceedings{Yang2025oct,
    • author = {Yang, Chiao-An and Peng, Kuan-Chuan and Yeh, Raymond},
    • title = {{Toward Long-Tailed Online Anomaly Detection through Class-Agnostic Concepts}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV)},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-124}
    • }
  •  Peng, K.-C., "Joint Training of Image Generator and Detector for Road Defect Detection", IEEE International Conference on Computer Vision (ICCV) Workshops, October 2025.
    BibTeX TR2025-149 PDF Video Presentation
    • @inproceedings{Peng2025oct,
    • author = {Peng, Kuan-Chuan},
    • title = {{Joint Training of Image Generator and Detector for Road Defect Detection}},
    • booktitle = {IEEE International Conference on Computer Vision (ICCV) Workshops},
    • year = 2025,
    • month = oct,
    • url = {https://www.merl.com/publications/TR2025-149}
    • }