Publications
Murray, Benjamin; Brown, Richard; Ma, Pengcheng; Kerfoot, Eric; Xu, Daguang; Feng, Andrew; Cardoso, Jorge; Ourselin, Sebastien; Modat, Marc
Lazy Resampling: Fast and information preserving preprocessing for deep learning Journal Article
In: Computer Methods and Programs in Biomedicine, vol. 257, pp. 108422, 2024, ISSN: 0169-2607.
@article{murray_lazy_2024,
title = {Lazy Resampling: Fast and information preserving preprocessing for deep learning},
author = {Benjamin Murray and Richard Brown and Pengcheng Ma and Eric Kerfoot and Daguang Xu and Andrew Feng and Jorge Cardoso and Sebastien Ourselin and Marc Modat},
url = {https://linkinghub.elsevier.com/retrieve/pii/S0169260724004152},
doi = {10.1016/j.cmpb.2024.108422},
issn = {0169-2607},
year = {2024},
date = {2024-12-01},
urldate = {2025-01-16},
journal = {Computer Methods and Programs in Biomedicine},
volume = {257},
pages = {108422},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Tran, Minh; Chang, Di; Siniukov, Maksim; Soleymani, Mohammad
DIM: Dyadic Interaction Modeling for Social Behavior Generation Book Section
In: Leonardis, Aleš; Ricci, Elisa; Roth, Stefan; Russakovsky, Olga; Sattler, Torsten; Varol, Gül (Ed.): Computer Vision – ECCV 2024, vol. 15095, pp. 484–503, Springer Nature Switzerland, Cham, 2024, ISBN: 978-3-031-72912-6 978-3-031-72913-3, (Series Title: Lecture Notes in Computer Science).
@incollection{leonardis_dim_2024,
title = {DIM: Dyadic Interaction Modeling for Social Behavior Generation},
author = {Minh Tran and Di Chang and Maksim Siniukov and Mohammad Soleymani},
editor = {Aleš Leonardis and Elisa Ricci and Stefan Roth and Olga Russakovsky and Torsten Sattler and Gül Varol},
url = {https://link.springer.com/10.1007/978-3-031-72913-3_27},
doi = {10.1007/978-3-031-72913-3_27},
isbn = {978-3-031-72912-6 978-3-031-72913-3},
year = {2024},
date = {2024-12-01},
urldate = {2025-01-16},
booktitle = {Computer Vision – ECCV 2024},
volume = {15095},
pages = {484–503},
publisher = {Springer Nature Switzerland},
address = {Cham},
note = {Series Title: Lecture Notes in Computer Science},
keywords = {},
pubstate = {published},
tppubtype = {incollection}
}
Xu, Jiuyi; Chen, Meida; Feng, Andrew; Yu, Zifan; Shi, Yangming
Open-Vocabulary High-Resolution 3D (OVHR3D) Data Segmentation and Annotation Framework Journal Article
In: 2024, (Publisher: arXiv, Version Number: 2).
@article{xu_open-vocabulary_2024,
title = {Open-Vocabulary High-Resolution 3D (OVHR3D) Data Segmentation and Annotation Framework},
author = {Jiuyi Xu and Meida Chen and Andrew Feng and Zifan Yu and Yangming Shi},
url = {https://arxiv.org/abs/2412.06268},
doi = {10.48550/ARXIV.2412.06268},
year = {2024},
date = {2024-12-01},
urldate = {2024-12-20},
abstract = {In the domain of the U.S. Army modeling and simulation, the availability of high quality annotated 3D data is pivotal to creating virtual environments for training and simulations. Traditional methodologies for 3D semantic and instance segmentation, such as KpConv, RandLA, Mask3D, etc., are designed to train on extensive labeled datasets to obtain satisfactory performance in practical tasks. This requirement presents a significant challenge, given the inherent scarcity of manually annotated 3D datasets, particularly for the military use cases. Recognizing this gap, our previous research leverages the One World Terrain data repository manually annotated databases, as showcased at IITSEC 2019 and 2021, to enrich the training dataset for deep learning models. However, collecting and annotating large scale 3D data for specific tasks remains costly and inefficient. To this end, the objective of this research is to design and develop a comprehensive and efficient framework for 3D segmentation tasks to assist in 3D data annotation. This framework integrates Grounding DINO and Segment anything Model, augmented by an enhancement in 2D image rendering via 3D mesh. Furthermore, the authors have also developed a user friendly interface that facilitates the 3D annotation process, offering intuitive visualization of rendered images and the 3D point cloud.},
note = {Publisher: arXiv, Version Number: 2},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Roemmele, Melissa; Gordon, Andrew
From Test-Taking to Test-Making: Examining LLM Authoring of Commonsense Assessment Items Proceedings Article
In: Findings of the Association for Computational Linguistics: EMNLP 2024, pp. 5193–5203, Association for Computational Linguistics, Miami, Florida, USA, 2024.
@inproceedings{roemmele_test-taking_2024,
title = {From Test-Taking to Test-Making: Examining LLM Authoring of Commonsense Assessment Items},
author = {Melissa Roemmele and Andrew Gordon},
url = {https://aclanthology.org/2024.findings-emnlp.299},
doi = {10.18653/v1/2024.findings-emnlp.299},
year = {2024},
date = {2024-11-01},
urldate = {2024-12-05},
booktitle = {Findings of the Association for Computational Linguistics: EMNLP 2024},
pages = {5193–5203},
publisher = {Association for Computational Linguistics},
address = {Miami, Florida, USA},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Zhu, Xin; Su, Zhenghui; Gratch, Jonathan; Culbertson, Heather
How Visualizing Touch Can Transform Perceptions of Intensity, Realism, and Emotion? Book Section
In: Kajimoto, Hiroyuki; Lopes, Pedro; Pacchierotti, Claudio; Basdogan, Cagatay; Gori, Monica; Lemaire-Semail, Betty; Marchal, Maud (Ed.): Haptics: Understanding Touch; Technology and Systems; Applications and Interaction, vol. 14768, pp. 194–207, Springer Nature Switzerland, Cham, 2024, ISBN: 978-3-031-70057-6 978-3-031-70058-3, (Series Title: Lecture Notes in Computer Science).
@incollection{kajimoto_how_2024,
title = {How Visualizing Touch Can Transform Perceptions of Intensity, Realism, and Emotion?},
author = {Xin Zhu and Zhenghui Su and Jonathan Gratch and Heather Culbertson},
editor = {Hiroyuki Kajimoto and Pedro Lopes and Claudio Pacchierotti and Cagatay Basdogan and Monica Gori and Betty Lemaire-Semail and Maud Marchal},
url = {https://link.springer.com/10.1007/978-3-031-70058-3_16},
doi = {10.1007/978-3-031-70058-3_16},
isbn = {978-3-031-70057-6 978-3-031-70058-3},
year = {2024},
date = {2024-11-01},
urldate = {2024-12-05},
booktitle = {Haptics: Understanding Touch; Technology and Systems; Applications and Interaction},
volume = {14768},
pages = {194–207},
publisher = {Springer Nature Switzerland},
address = {Cham},
note = {Series Title: Lecture Notes in Computer Science},
keywords = {},
pubstate = {published},
tppubtype = {incollection}
}
Siniukov, Maksim; Yin, Yufeng; Fast, Eli; Qi, Yingshan; Monga, Aarav; Kim, Audrey; Soleymani, Mohammad
SEMPI: A Database for Understanding Social Engagement in Video-Mediated Multiparty Interaction Proceedings Article
In: International Conference on Multimodal Interaction, pp. 546–555, ACM, San Jose, Costa Rica, 2024, ISBN: 979-8-4007-0462-8.
@inproceedings{siniukov_sempi_2024,
title = {SEMPI: A Database for Understanding Social Engagement in Video-Mediated Multiparty Interaction},
author = {Maksim Siniukov and Yufeng Yin and Eli Fast and Yingshan Qi and Aarav Monga and Audrey Kim and Mohammad Soleymani},
url = {https://dl.acm.org/doi/10.1145/3678957.3685752},
doi = {10.1145/3678957.3685752},
isbn = {979-8-4007-0462-8},
year = {2024},
date = {2024-11-01},
urldate = {2024-12-05},
booktitle = {International Conference on Multimodal Interaction},
pages = {546–555},
publisher = {ACM},
address = {San Jose, Costa Rica},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Andalibi, Nazanin; Stark, Luke; McDuff, Daniel; Picard, Rosalind; Gratch, Jonathan; Howell, Noura
What should we do with Emotion AI? Towards an Agenda for the Next 30 Years Proceedings Article
In: Companion Publication of the 2024 Conference on Computer-Supported Cooperative Work and Social Computing, pp. 98–101, ACM, San Jose, Costa Rica, 2024, ISBN: 979-8-4007-1114-5.
@inproceedings{andalibi_what_2024,
title = {What should we do with Emotion AI? Towards an Agenda for the Next 30 Years},
author = {Nazanin Andalibi and Luke Stark and Daniel McDuff and Rosalind Picard and Jonathan Gratch and Noura Howell},
url = {https://dl.acm.org/doi/10.1145/3678884.3689135},
doi = {10.1145/3678884.3689135},
isbn = {979-8-4007-1114-5},
year = {2024},
date = {2024-11-01},
urldate = {2024-12-05},
booktitle = {Companion Publication of the 2024 Conference on Computer-Supported Cooperative Work and Social Computing},
pages = {98–101},
publisher = {ACM},
address = {San Jose, Costa Rica},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Loucks, Laura; Rizzo, Albert; Rothbaum, Barbara O.
Virtual Reality Exposure for Treating PTSD Due to Military Sexual Trauma Journal Article
In: J Clin Psychol, pp. jclp.23750, 2024, ISSN: 0021-9762, 1097-4679.
@article{loucks_virtual_2024,
title = {Virtual Reality Exposure for Treating PTSD Due to Military Sexual Trauma},
author = {Laura Loucks and Albert Rizzo and Barbara O. Rothbaum},
url = {https://onlinelibrary.wiley.com/doi/10.1002/jclp.23750},
doi = {10.1002/jclp.23750},
issn = {0021-9762, 1097-4679},
year = {2024},
date = {2024-11-01},
urldate = {2024-12-05},
journal = {J Clin Psychol},
pages = {jclp.23750},
abstract = {Virtual reality exposure therapy (VRE) has been used in the treatment of combat‐related PTSD since the late 1990s and was recently adapted to treat PTSD due to military sexual trauma (MST). With content specifically tailored to MST‐related contexts, we present the case study of a military veteran who participated in the open clinical trial examining the feasibility of VRE in the treatment of MST‐related PTSD (Loucks et al. 2019). We illustrate VRE's use in activating the trauma memory to facilitate therapeutic emotional processing across sessions and overall symptom reduction. The case study includes common challenges that may occur during VRE and relevant recommendations. The discussion will include lessons learned from the case study and the open clinical trial, recommendations for the flexible application of VRE, and the ongoing developments in the latest version of the VRE system, informed by feedback acquired from the clinicians and patients who experienced it in the initial clinical trial.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Hills, Mellanie; Korjian, Serge; Chi, Gerald; Natale, Andrea; Saxon, Leslie; Ferdinand, Keith; Kwaku, Kevin; Brancato, Scott; Baca-Motes, Katie; Steinhubl, Steve; Wessler, Jeff; Goldberg, Nieca; Asthana, Anisha; Shute, Kate; Applebaum, Jill; Doran, Kathleen; Nikolovski, Janeta; Kaul, Simrati; Wentworth, Dereck; Damaraju, Cv; DeFalco, Frank; Tavakoli, Cammie; Patel, Mithun; Curtis, Anne; Spertus, John; Gibson, Charles
Insights for Direct-to-Patient Clinical Trial Recruitment Strategies From the Heartline Study Journal Article
In: Circulation, vol. 150, no. Suppl_1, 2024, ISSN: 0009-7322, 1524-4539.
@article{hills_insights_2024,
title = {Insights for Direct-to-Patient Clinical Trial Recruitment Strategies From the Heartline Study},
author = {Mellanie Hills and Serge Korjian and Gerald Chi and Andrea Natale and Leslie Saxon and Keith Ferdinand and Kevin Kwaku and Scott Brancato and Katie Baca-Motes and Steve Steinhubl and Jeff Wessler and Nieca Goldberg and Anisha Asthana and Kate Shute and Jill Applebaum and Kathleen Doran and Janeta Nikolovski and Simrati Kaul and Dereck Wentworth and Cv Damaraju and Frank DeFalco and Cammie Tavakoli and Mithun Patel and Anne Curtis and John Spertus and Charles Gibson},
url = {https://www.ahajournals.org/doi/10.1161/circ.150.suppl_1.4143017},
doi = {10.1161/circ.150.suppl_1.4143017},
issn = {0009-7322, 1524-4539},
year = {2024},
date = {2024-11-01},
urldate = {2024-12-05},
journal = {Circulation},
volume = {150},
number = {Suppl_1},
abstract = {Background:
Decentralized clinical trials using direct-to-participant recruitment can potentially engage large, representative participant pools.
Research Question:
Can a decentralized clinical trial use a multichannel approach to recruit patients >65 years old across the United States?
Goals/Aims:
To share insights on multichannel strategies for participant recruitment in the decentralized, app-based Heartline study.
Methods:
Heartline is a randomized trial testing the impact of a mobile app-based heart health program with the electrocardiogram (ECG) and Irregular Rhythm Notification (IRN) features on Apple Watch for early diagnosis, treatment, and outcomes of atrial fibrillation. Eligible participants were US adults aged ≥65 years with an iPhone and Medicare coverage. Multiple pathways for broad outreach were explored, including digital (eg, email, social media) and traditional channels (eg, direct mail, community outreach). Recruitment efforts were assessed and refined to reach a large eligible population.
Results:
A multichannel approach led to ~300,000 Heartline study app installations. In total, 34,244 participants completed enrollment (Feb 2020-Dec 2022), of whom 28,155 completed baseline demographic assessments. Participants were widely distributed geographically, with notable representation of outlying and rural areas (Figure 1). Women accounted for 54% of the participants. Overall, most participants were White (93.0%), with Asian, Black, and Hispanic participants representing 2.8%, 2.7%, and 2.5%, respectively.
Conclusion:
The Heartline study demonstrated the ability to recruit large numbers of participants aged ≥65 years using a direct-to-participant approach. Broad outreach strategies ensured gender and geographic diversity, enrolling a higher percentage of women than typical cardiology trials, and participation from rural areas. However, underrepresentation across racial/ethnic groups persisted and strategies to increase enrollment are needed. For similar trials, a strategic multichannel approach, with strong data and analytics capabilities may be beneficial to effectively target and enroll eligible participants.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Chen, Meida; Han, Kangle; Yu, Zifan; Feng, Andrew; Hou, Yu; You, Suya; Soibelman, Lucio
An Aerial Photogrammetry Benchmark Dataset for Point Cloud Segmentation and Style Translation Journal Article
In: Remote Sensing, vol. 16, no. 22, pp. 4240, 2024, ISSN: 2072-4292.
@article{chen_aerial_2024,
title = {An Aerial Photogrammetry Benchmark Dataset for Point Cloud Segmentation and Style Translation},
author = {Meida Chen and Kangle Han and Zifan Yu and Andrew Feng and Yu Hou and Suya You and Lucio Soibelman},
url = {https://www.mdpi.com/2072-4292/16/22/4240},
doi = {10.3390/rs16224240},
issn = {2072-4292},
year = {2024},
date = {2024-11-01},
urldate = {2024-12-05},
journal = {Remote Sensing},
volume = {16},
number = {22},
pages = {4240},
abstract = {The recent surge in diverse 3D datasets spanning various scales and applications marks a significant advancement in the field. However, the comprehensive process of data acquisition, refinement, and annotation at a large scale poses a formidable challenge, particularly for individual researchers and small teams. To this end, we present a novel synthetic 3D point cloud generation framework that can produce detailed outdoor aerial photogrammetric 3D datasets with accurate ground truth annotations without the labor-intensive and time-consuming data collection/annotation processes. Our pipeline procedurally generates synthetic environments, mirroring real-world data collection and 3D reconstruction processes. A key feature of our framework is its ability to replicate consistent quality, noise patterns, and diversity similar to real-world datasets. This is achieved by adopting UAV flight patterns that resemble those used in real-world data collection processes (e.g., the cross-hatch flight pattern) across various synthetic terrains that are procedurally generated, thereby ensuring data consistency akin to real-world scenarios. Moreover, the generated datasets are enriched with precise semantic and instance annotations, eliminating the need for manual labeling. Our approach has led to the development and release of the Semantic Terrain Points Labeling—Synthetic 3D (STPLS3D) benchmark, an extensive outdoor 3D dataset encompassing over 16 km2, featuring up to 19 semantic labels. We also collected, reconstructed, and annotated four real-world datasets for validation purposes. Extensive experiments on these datasets demonstrate our synthetic datasets’ effectiveness, superior quality, and their value as a benchmark dataset for further point cloud research.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Bonial, Claire; Lukin, Stephanie M.; Abrams, Mitchell; Baker, Anthony; Donatelli, Lucia; Foots, Ashley; Hayes, Cory J.; Henry, Cassidy; Hudson, Taylor; Marge, Matthew; Pollard, Kimberly A.; Artstein, Ron; Traum, David; Voss, Clare R.
Human–robot dialogue annotation for multi-modal common ground Journal Article
In: Lang Resources & Evaluation, 2024, ISSN: 1574-020X, 1574-0218.
@article{bonial_humanrobot_2024,
title = {Human–robot dialogue annotation for multi-modal common ground},
author = {Claire Bonial and Stephanie M. Lukin and Mitchell Abrams and Anthony Baker and Lucia Donatelli and Ashley Foots and Cory J. Hayes and Cassidy Henry and Taylor Hudson and Matthew Marge and Kimberly A. Pollard and Ron Artstein and David Traum and Clare R. Voss},
url = {https://link.springer.com/10.1007/s10579-024-09784-2},
doi = {10.1007/s10579-024-09784-2},
issn = {1574-020X, 1574-0218},
year = {2024},
date = {2024-11-01},
urldate = {2024-12-05},
journal = {Lang Resources & Evaluation},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Marti, Deniz; Budathoki, Anjila; Ding, Yi; Lucas, Gale; Nelson, David
How Does Acknowledging Users’ Preferences Impact AI’s Ability to Make Conflicting Recommendations? Journal Article
In: International Journal of Human–Computer Interaction, pp. 1–12, 2024, ISSN: 1044-7318, 1532-7590.
@article{marti_how_2024,
title = {How Does Acknowledging Users’ Preferences Impact AI’s Ability to Make Conflicting Recommendations?},
author = {Deniz Marti and Anjila Budathoki and Yi Ding and Gale Lucas and David Nelson},
url = {https://www.tandfonline.com/doi/full/10.1080/10447318.2024.2426035},
doi = {10.1080/10447318.2024.2426035},
issn = {1044-7318, 1532-7590},
year = {2024},
date = {2024-11-01},
urldate = {2024-12-05},
journal = {International Journal of Human–Computer Interaction},
pages = {1–12},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Vlake, Johan H; Drop, Denzel L Q; Bommel, Jasper Van; Riva, Giuseppe; Wiederhold, Brenda K; Cipresso, Pietro; Rizzo, Albert S; Rothbaum, Barbara O; Botella, Cristina; Hooft, Lotty; Bienvenu, Oscar J; Jung, Christian; Geerts, Bart; Wils, Evert-Jan; Gommers, Diederik; Genderen, Michel E Van; Group, RATE-XR Expert
Reporting Guidelines for the Early-Phase Clinical Evaluation of Applications Using Extended Reality: RATE-XR Qualitative Study Guideline Journal Article
In: J Med Internet Res, vol. 26, pp. e56790, 2024, ISSN: 1438-8871.
@article{vlake_reporting_2024,
title = {Reporting Guidelines for the Early-Phase Clinical Evaluation of Applications Using Extended Reality: RATE-XR Qualitative Study Guideline},
author = {Johan H Vlake and Denzel L Q Drop and Jasper Van Bommel and Giuseppe Riva and Brenda K Wiederhold and Pietro Cipresso and Albert S Rizzo and Barbara O Rothbaum and Cristina Botella and Lotty Hooft and Oscar J Bienvenu and Christian Jung and Bart Geerts and Evert-Jan Wils and Diederik Gommers and Michel E Van Genderen and RATE-XR Expert Group},
url = {https://www.jmir.org/2024/1/e56790},
doi = {10.2196/56790},
issn = {1438-8871},
year = {2024},
date = {2024-11-01},
urldate = {2024-12-05},
journal = {J Med Internet Res},
volume = {26},
pages = {e56790},
abstract = {Background
Extended reality (XR), encompassing technologies such as virtual reality, augmented reality, and mixed reality, has rapidly gained prominence in health care. However, existing XR research often lacks rigor, proper controls, and standardization.
Objective
To address this and to enhance the transparency and quality of reporting in early-phase clinical evaluations of XR applications, we present the “Reporting for the early-phase clinical evaluation of applications using extended reality” (RATE-XR) guideline.
Methods
We conducted a 2-round modified Delphi process involving experts from diverse stakeholder categories, and the RATE-XR is therefore the result of a consensus-based, multistakeholder effort.
Results
The guideline comprises 17 XR-specific (composed of 18 subitems) and 14 generic reporting items, each with a complementary Explanation & Elaboration section.
Conclusions
The items encompass critical aspects of XR research, from clinical utility and safety to human factors and ethics. By offering a comprehensive checklist for reporting, the RATE-XR guideline facilitates robust assessment and replication of early-stage clinical XR studies. It underscores the need for transparency, patient-centeredness, and balanced evaluation of the applications of XR in health care. By providing an actionable checklist of minimal reporting items, this guideline will facilitate the responsible development and integration of XR technologies into health care and related fields.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Roemmele, Melissa; Gordon, Andrew S.
From Test-Taking to Test-Making: Examining LLM Authoring of Commonsense Assessment Items Miscellaneous
2024, (Version Number: 1).
@misc{roemmele_test-taking_2024-1,
title = {From Test-Taking to Test-Making: Examining LLM Authoring of Commonsense Assessment Items},
author = {Melissa Roemmele and Andrew S. Gordon},
url = {https://arxiv.org/abs/2410.14897},
doi = {10.48550/ARXIV.2410.14897},
year = {2024},
date = {2024-10-01},
urldate = {2024-12-05},
publisher = {arXiv},
abstract = {LLMs can now perform a variety of complex writing tasks. They also excel in answering questions pertaining to natural language inference and commonsense reasoning. Composing these questions is itself a skilled writing task, so in this paper we consider LLMs as authors of commonsense assessment items. We prompt LLMs to generate items in the style of a prominent benchmark for commonsense reasoning, the Choice of Plausible Alternatives (COPA). We examine the outcome according to analyses facilitated by the LLMs and human annotation. We find that LLMs that succeed in answering the original COPA benchmark are also more successful in authoring their own items.},
note = {Version Number: 1},
keywords = {},
pubstate = {published},
tppubtype = {misc}
}
Lin, Spencer; Rizk, Basem; Jun, Miru; Artze, Andy; Sullivan, Caitlin; Mozgai, Sharon; Fisher, Scott
Estuary: A Framework For Building Multimodal Low-Latency Real-Time Socially Interactive Agents Miscellaneous
2024, (arXiv:2410.20116 [cs]).
@misc{lin_estuary_2024,
title = {Estuary: A Framework For Building Multimodal Low-Latency Real-Time Socially Interactive Agents},
author = {Spencer Lin and Basem Rizk and Miru Jun and Andy Artze and Caitlin Sullivan and Sharon Mozgai and Scott Fisher},
url = {http://arxiv.org/abs/2410.20116},
doi = {10.1145/3652988.3696198},
year = {2024},
date = {2024-10-01},
urldate = {2024-12-06},
abstract = {The rise in capability and ubiquity of generative artificial intelligence (AI) technologies has enabled its application to the field of Socially Interactive Agents (SIAs). Despite rising interest in modern AI-powered components used for real-time SIA research, substantial friction remains due to the absence of a standardized and universal SIA framework. To target this absence, we developed Estuary: a multimodal (text, audio, and soon video) framework which facilitates the development of low-latency, real-time SIAs. Estuary seeks to reduce repeat work between studies and to provide a flexible platform that can be run entirely off-cloud to maximize configurability, controllability, reproducibility of studies, and speed of agent response times. We are able to do this by constructing a robust multimodal framework which incorporates current and future components seamlessly into a modular and interoperable architecture.},
note = {arXiv:2410.20116 [cs]},
keywords = {},
pubstate = {published},
tppubtype = {misc}
}
Tran, Minh; Kim, Yelin; Su, Che-Chun; Kuo, Cheng-Hao; Sun, Min; Soleymani, Mohammad
Ex2Eg-MAE: A Framework for Adaptation of Exocentric Video Masked Autoencoders for Egocentric Social Role Understanding Book Section
In: Leonardis, Aleš; Ricci, Elisa; Roth, Stefan; Russakovsky, Olga; Sattler, Torsten; Varol, Gül (Ed.): Computer Vision – ECCV 2024, vol. 15138, pp. 1–19, Springer Nature Switzerland, Cham, 2024, ISBN: 978-3-031-72988-1 978-3-031-72989-8, (Series Title: Lecture Notes in Computer Science).
@incollection{leonardis_ex2eg-mae_2024,
title = {Ex2Eg-MAE: A Framework for Adaptation of Exocentric Video Masked Autoencoders for Egocentric Social Role Understanding},
author = {Minh Tran and Yelin Kim and Che-Chun Su and Cheng-Hao Kuo and Min Sun and Mohammad Soleymani},
editor = {Aleš Leonardis and Elisa Ricci and Stefan Roth and Olga Russakovsky and Torsten Sattler and Gül Varol},
url = {https://link.springer.com/10.1007/978-3-031-72989-8_1},
doi = {10.1007/978-3-031-72989-8_1},
isbn = {978-3-031-72988-1 978-3-031-72989-8},
year = {2024},
date = {2024-10-01},
urldate = {2024-12-06},
booktitle = {Computer Vision – ECCV 2024},
volume = {15138},
pages = {1–19},
publisher = {Springer Nature Switzerland},
address = {Cham},
note = {Series Title: Lecture Notes in Computer Science},
keywords = {},
pubstate = {published},
tppubtype = {incollection}
}
Chen, Gonglin; Wu, Jinsen; Chen, Haiwei; Teng, Wenbin; Gao, Zhiyuan; Feng, Andrew; Qin, Rongjun; Zhao, Yajie
Geometry-aware Feature Matching for Large-Scale Structure from Motion Miscellaneous
2024, (Version Number: 3).
@misc{chen_geometry-aware_2024,
title = {Geometry-aware Feature Matching for Large-Scale Structure from Motion},
author = {Gonglin Chen and Jinsen Wu and Haiwei Chen and Wenbin Teng and Zhiyuan Gao and Andrew Feng and Rongjun Qin and Yajie Zhao},
url = {https://arxiv.org/abs/2409.02310},
doi = {10.48550/ARXIV.2409.02310},
year = {2024},
date = {2024-09-01},
urldate = {2025-01-16},
publisher = {arXiv},
abstract = {Establishing consistent and dense correspondences across multiple images is crucial for Structure from Motion (SfM) systems. Significant view changes, such as air-to-ground with very sparse view overlap, pose an even greater challenge to the correspondence solvers. We present a novel optimization-based approach that significantly enhances existing feature matching methods by introducing geometry cues in addition to color cues. This helps fill gaps when there is less overlap in large-scale scenarios. Our method formulates geometric verification as an optimization problem, guiding feature matching within detector-free methods and using sparse correspondences from detector-based methods as anchor points. By enforcing geometric constraints via the Sampson Distance, our approach ensures that the denser correspondences from detector-free methods are geometrically consistent and more accurate. This hybrid strategy significantly improves correspondence density and accuracy, mitigates multi-view inconsistencies, and leads to notable advancements in camera pose accuracy and point cloud density. It outperforms state-of-the-art feature matching methods on benchmark datasets and enables feature matching in challenging extreme large-scale settings.},
note = {Version Number: 3},
keywords = {},
pubstate = {published},
tppubtype = {misc}
}
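A note for readers: the Sampson Distance that this abstract uses for geometric verification is, in standard multi-view geometry references (e.g., Hartley and Zisserman), a first-order approximation of the reprojection error; the paper may use a variant, but for a fundamental matrix F and a homogeneous correspondence x ↔ x' the usual form is

\[ d_{S}(\mathbf{x}, \mathbf{x}') = \frac{(\mathbf{x}'^{\top} F \mathbf{x})^{2}}{(F\mathbf{x})_{1}^{2} + (F\mathbf{x})_{2}^{2} + (F^{\top}\mathbf{x}')_{1}^{2} + (F^{\top}\mathbf{x}')_{2}^{2}} \]

Correspondences with small d_S are consistent with the epipolar geometry, which is what lets dense detector-free matches be kept only when they agree with the estimated two-view geometry.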
Hale, James; Schweitzer, Lindsey; Gratch, Jonathan
Pitfalls of Embodiment in Human-Agent Experiment Design Proceedings Article
In: Proceedings of the ACM International Conference on Intelligent Virtual Agents, pp. 1–9, ACM, Glasgow, United Kingdom, 2024, ISBN: 979-8-4007-0625-7.
@inproceedings{hale_pitfalls_2024,
title = {Pitfalls of Embodiment in Human-Agent Experiment Design},
author = {James Hale and Lindsey Schweitzer and Jonathan Gratch},
url = {https://dl.acm.org/doi/10.1145/3652988.3673958},
doi = {10.1145/3652988.3673958},
isbn = {979-8-4007-0625-7},
year = {2024},
date = {2024-09-01},
urldate = {2025-01-16},
booktitle = {Proceedings of the ACM International Conference on Intelligent Virtual Agents},
pages = {1–9},
publisher = {ACM},
address = {Glasgow, United Kingdom},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Gao, Zhiyuan; Teng, Wenbin; Chen, Gonglin; Wu, Jinsen; Xu, Ningli; Qin, Rongjun; Feng, Andrew; Zhao, Yajie
Skyeyes: Ground Roaming using Aerial View Images Miscellaneous
2024, (Version Number: 1).
@misc{gao_skyeyes_2024,
title = {Skyeyes: Ground Roaming using Aerial View Images},
author = {Zhiyuan Gao and Wenbin Teng and Gonglin Chen and Jinsen Wu and Ningli Xu and Rongjun Qin and Andrew Feng and Yajie Zhao},
url = {https://arxiv.org/abs/2409.16685},
doi = {10.48550/ARXIV.2409.16685},
year = {2024},
date = {2024-09-01},
urldate = {2025-01-16},
publisher = {arXiv},
abstract = {Integrating aerial imagery-based scene generation into applications like autonomous driving and gaming enhances realism in 3D environments, but challenges remain in creating detailed content for occluded areas and ensuring real-time, consistent rendering. In this paper, we introduce Skyeyes, a novel framework that can generate photorealistic sequences of ground view images using only aerial view inputs, thereby creating a ground roaming experience. More specifically, we combine a 3D representation with a view consistent generation model, which ensures coherence between generated images. This method allows for the creation of geometrically consistent ground view images, even with large view gaps. The images maintain improved spatial-temporal coherence and realism, enhancing scene comprehension and visualization from aerial perspectives. To the best of our knowledge, there are no publicly available datasets that contain pairwise geo-aligned aerial and ground view imagery. Therefore, we build a large, synthetic, and geo-aligned dataset using Unreal Engine. Both qualitative and quantitative analyses on this synthetic dataset display superior results compared to other leading synthesis approaches. See the project page for more results: https://chaoren2357.github.io/website-skyeyes/.},
note = {Version Number: 1},
keywords = {},
pubstate = {published},
tppubtype = {misc}
}
Hale, James; Schweitzer, Lindsey; Gratch, Jonathan
Integration of LLMs with Virtual Character Embodiment Proceedings Article
In: Proceedings of the ACM International Conference on Intelligent Virtual Agents, pp. 1–3, ACM, Glasgow, United Kingdom, 2024, ISBN: 979-8-4007-0625-7.
@inproceedings{hale_integration_2024,
title = {Integration of LLMs with Virtual Character Embodiment},
author = {James Hale and Lindsey Schweitzer and Jonathan Gratch},
url = {https://dl.acm.org/doi/10.1145/3652988.3696199},
doi = {10.1145/3652988.3696199},
isbn = {979-8-4007-0625-7},
year = {2024},
date = {2024-09-01},
urldate = {2025-01-16},
booktitle = {Proceedings of the ACM International Conference on Intelligent Virtual Agents},
pages = {1–3},
publisher = {ACM},
address = {Glasgow, United Kingdom},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Roth, Holger R.; Beutel, Daniel J.; Cheng, Yan; Marques, Javier Fernandez; Pan, Heng; Chen, Chester; Zhang, Zhihong; Wen, Yuhong; Yang, Sean; Yang, Isaac; Hsieh, Yuan-Ting; Xu, Ziyue; Xu, Daguang; Lane, Nicholas D.; Feng, Andrew
Supercharging Federated Learning with Flower and NVIDIA FLARE Miscellaneous
2024, (arXiv:2407.00031 [cs]).
@misc{roth_supercharging_2024,
title = {Supercharging Federated Learning with Flower and NVIDIA FLARE},
author = {Holger R. Roth and Daniel J. Beutel and Yan Cheng and Javier Fernandez Marques and Heng Pan and Chester Chen and Zhihong Zhang and Yuhong Wen and Sean Yang and Isaac Yang and Yuan-Ting Hsieh and Ziyue Xu and Daguang Xu and Nicholas D. Lane and Andrew Feng},
url = {http://arxiv.org/abs/2407.00031},
doi = {10.48550/arXiv.2407.00031},
year = {2024},
date = {2024-07-01},
urldate = {2025-01-16},
publisher = {arXiv},
abstract = {Several open-source systems, such as Flower and NVIDIA FLARE, have been developed in recent years while focusing on different aspects of federated learning (FL). Flower is dedicated to implementing a cohesive approach to FL, analytics, and evaluation. Over time, Flower has cultivated extensive strategies and algorithms tailored for FL application development, fostering a vibrant FL community in research and industry. Conversely, FLARE has prioritized the creation of an enterprise-ready, resilient runtime environment explicitly designed for FL applications in production environments. In this paper, we describe our initial integration of both frameworks and show how they can work together to supercharge the FL ecosystem as a whole. Through the seamless integration of Flower and FLARE, applications crafted within the Flower framework can effortlessly operate within the FLARE runtime environment without necessitating any modifications. This initial integration streamlines the process, eliminating complexities and ensuring smooth interoperability between the two platforms, thus enhancing the overall efficiency and accessibility of FL applications.},
note = {arXiv:2407.00031 [cs]},
keywords = {},
pubstate = {published},
tppubtype = {misc}
}
Diaz-Pinto, Andres; Alle, Sachidanand; Nath, Vishwesh; Tang, Yucheng; Ihsani, Alvin; Asad, Muhammad; Pérez-García, Fernando; Mehta, Pritesh; Li, Wenqi; Flores, Mona; Roth, Holger R.; Vercauteren, Tom; Xu, Daguang; Dogra, Prerna; Ourselin, Sebastien; Feng, Andrew; Cardoso, M. Jorge
MONAI Label: A framework for AI-assisted interactive labeling of 3D medical images Journal Article
In: Medical Image Analysis, vol. 95, pp. 103207, 2024, ISSN: 1361-8415.
@article{diaz-pinto_monai_2024,
title = {MONAI Label: A framework for AI-assisted interactive labeling of 3D medical images},
author = {Andres Diaz-Pinto and Sachidanand Alle and Vishwesh Nath and Yucheng Tang and Alvin Ihsani and Muhammad Asad and Fernando Pérez-García and Pritesh Mehta and Wenqi Li and Mona Flores and Holger R. Roth and Tom Vercauteren and Daguang Xu and Prerna Dogra and Sebastien Ourselin and Andrew Feng and M. Jorge Cardoso},
url = {https://linkinghub.elsevier.com/retrieve/pii/S1361841524001324},
doi = {10.1016/j.media.2024.103207},
issn = {1361-8415},
year = {2024},
date = {2024-07-01},
urldate = {2025-01-16},
journal = {Medical Image Analysis},
volume = {95},
pages = {103207},
keywords = {MedVR},
pubstate = {published},
tppubtype = {article}
}
Huang, Shuo; Jones, Fred; Gurney, Nikolos; Pynadath, David; Srivastava, Kunal; Trent, Stoney; Wu, Peggy; Zhu, Quanyan
PsybORG+: Modeling and Simulation for Detecting Cognitive Biases in Advanced Persistent Threats Miscellaneous
2024, (Version Number: 3).
@misc{huang_psyborg_2024,
title = {PsybORG+: Modeling and Simulation for Detecting Cognitive Biases in Advanced Persistent Threats},
author = {Shuo Huang and Fred Jones and Nikolos Gurney and David Pynadath and Kunal Srivastava and Stoney Trent and Peggy Wu and Quanyan Zhu},
url = {https://arxiv.org/abs/2408.01310},
doi = {10.48550/ARXIV.2408.01310},
year = {2024},
date = {2024-07-01},
urldate = {2024-12-05},
publisher = {arXiv},
abstract = {Advanced Persistent Threats (APTs) bring significant challenges to cybersecurity due to their sophisticated and stealthy nature. Traditional cybersecurity measures fail to defend against APTs. Cognitive vulnerabilities can significantly influence attackers' decision-making processes, which presents an opportunity for defenders to exploit. This work introduces PsybORG$ˆ+$, a multi-agent cybersecurity simulation environment designed to model APT behaviors influenced by cognitive vulnerabilities. A classification model is built for cognitive vulnerability inference and a simulator is designed for synthetic data generation. Results show that PsybORG$ˆ+$ can effectively model APT attackers with different loss aversion and confirmation bias levels. The classification model has at least a 0.83 accuracy rate in predicting cognitive vulnerabilities.},
note = {Version Number: 3},
keywords = {DTIC},
pubstate = {published},
tppubtype = {misc}
}
Owayyed, Mohammed Al; Tielman, Myrthe; Hartholt, Arno; Specht, Marcus; Brinkman, Willem-Paul
Agent-based social skills training systems: the ARTES architecture, interaction characteristics, learning theories and future outlooks Journal Article
In: Behaviour & Information Technology, pp. 1–28, 2024, ISSN: 0144-929X, 1362-3001.
@article{al_owayyed_agent-based_2024,
title = {Agent-based social skills training systems: the ARTES architecture, interaction characteristics, learning theories and future outlooks},
author = {Mohammed Al Owayyed and Myrthe Tielman and Arno Hartholt and Marcus Specht and Willem-Paul Brinkman},
url = {https://www.tandfonline.com/doi/full/10.1080/0144929X.2024.2374891},
doi = {10.1080/0144929X.2024.2374891},
issn = {0144-929X, 1362-3001},
year = {2024},
date = {2024-07-01},
urldate = {2024-08-15},
journal = {Behaviour & Information Technology},
pages = {1–28},
keywords = {Virtual Agents, Virtual Humans},
pubstate = {published},
tppubtype = {article}
}
Bell, Imogen H.; Pot-Kolder, Roos; Rizzo, Albert; Rus-Calafell, Mar; Cardi, Valentina; Cella, Matteo; Ward, Thomas; Riches, Simon; Reinoso, Martin; Thompson, Andrew; Alvarez-Jimenez, Mario; Valmaggia, Lucia
Advances in the use of virtual reality to treat mental health conditions Journal Article
In: Nat Rev Psychol, 2024, ISSN: 2731-0574.
@article{bell_advances_2024,
title = {Advances in the use of virtual reality to treat mental health conditions},
author = {Imogen H. Bell and Roos Pot-Kolder and Albert Rizzo and Mar Rus-Calafell and Valentina Cardi and Matteo Cella and Thomas Ward and Simon Riches and Martin Reinoso and Andrew Thompson and Mario Alvarez-Jimenez and Lucia Valmaggia},
url = {https://www.nature.com/articles/s44159-024-00334-9},
doi = {10.1038/s44159-024-00334-9},
issn = {2731-0574},
year = {2024},
date = {2024-07-01},
urldate = {2024-07-11},
journal = {Nat Rev Psychol},
keywords = {MedVR},
pubstate = {published},
tppubtype = {article}
}
Gunasekara, Chulaka; Kim, Seokhwan; D'Haro, Luis Fernando; Rastogi, Abhinav; Chen, Yun-Nung; Eric, Mihail; Hedayatnia, Behnam; Gopalakrishnan, Karthik; Liu, Yang; Huang, Chao-Wei; Hakkani-Tür, Dilek; Li, Jinchao; Zhu, Qi; Luo, Lingxiao; Liden, Lars; Huang, Kaili; Shayandeh, Shahin; Liang, Runze; Peng, Baolin; Zhang, Zheng; Shukla, Swadheen; Huang, Minlie; Gao, Jianfeng; Mehri, Shikib; Feng, Yulan; Gordon, Carla; Alavi, Seyed Hossein; Traum, David; Eskenazi, Maxine; Beirami, Ahmad; Cho, Eunjoon; Crook, Paul A.; De, Ankita; Geramifard, Alborz; Kottur, Satwik; Moon, Seungwhan; Poddar, Shivani; Subba, Rajen
Overview of the Ninth Dialog System Technology Challenge: DSTC9 Journal Article
In: IEEE/ACM Trans. Audio Speech Lang. Process., pp. 1–10, 2024, ISSN: 2329-9290, 2329-9304.
@article{gunasekara_overview_2024,
title = {Overview of the Ninth Dialog System Technology Challenge: DSTC9},
author = {Chulaka Gunasekara and Seokhwan Kim and Luis Fernando D'Haro and Abhinav Rastogi and Yun-Nung Chen and Mihail Eric and Behnam Hedayatnia and Karthik Gopalakrishnan and Yang Liu and Chao-Wei Huang and Dilek Hakkani-Tür and Jinchao Li and Qi Zhu and Lingxiao Luo and Lars Liden and Kaili Huang and Shahin Shayandeh and Runze Liang and Baolin Peng and Zheng Zhang and Swadheen Shukla and Minlie Huang and Jianfeng Gao and Shikib Mehri and Yulan Feng and Carla Gordon and Seyed Hossein Alavi and David Traum and Maxine Eskenazi and Ahmad Beirami and Eunjoon Cho and Paul A. Crook and Ankita De and Alborz Geramifard and Satwik Kottur and Seungwhan Moon and Shivani Poddar and Rajen Subba},
url = {https://ieeexplore.ieee.org/document/10595468/},
doi = {10.1109/TASLP.2024.3426331},
issn = {2329-9290, 2329-9304},
year = {2024},
date = {2024-07-01},
urldate = {2024-08-15},
journal = {IEEE/ACM Trans. Audio Speech Lang. Process.},
pages = {1–10},
keywords = {Natural Language},
pubstate = {published},
tppubtype = {article}
}
Han, Bin; Yau, Cleo; Lei, Su; Gratch, Jonathan
In-Depth Analysis of Emotion Recognition through Knowledge-Based Large Language Models Miscellaneous
2024, (arXiv:2408.00780 [cs]).
@misc{han_-depth_2024,
title = {In-Depth Analysis of Emotion Recognition through Knowledge-Based Large Language Models},
author = {Bin Han and Cleo Yau and Su Lei and Jonathan Gratch},
url = {http://arxiv.org/abs/2408.00780},
year = {2024},
date = {2024-07-01},
urldate = {2024-08-15},
publisher = {arXiv},
abstract = {Emotion recognition in social situations is a complex task that requires integrating information from both facial expressions and the situational context. While traditional approaches to automatic emotion recognition have focused on decontextualized signals, recent research emphasizes the importance of context in shaping emotion perceptions. This paper contributes to the emerging field of context-based emotion recognition by leveraging psychological theories of human emotion perception to inform the design of automated methods. We propose an approach that combines emotion recognition methods with Bayesian Cue Integration (BCI) to integrate emotion inferences from decontextualized facial expressions and contextual knowledge inferred via Large-language Models. We test this approach in the context of interpreting facial expressions during a social task, the prisoner's dilemma. Our results provide clear support for BCI across a range of automatic emotion recognition methods. The best automated method achieved results comparable to human observers, suggesting the potential for this approach to advance the field of affective computing.},
note = {arXiv:2408.00780 [cs]},
keywords = {Virtual Humans},
pubstate = {published},
tppubtype = {misc}
}
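For context, Bayesian Cue Integration as named in this abstract conventionally combines independent evidence sources by multiplying their posteriors and dividing out the shared prior; whether the paper uses exactly this form is an assumption here. For an emotion e, a facial cue f, and a contextual cue c, conditional independence of the cues given e yields

\[ P(e \mid f, c) \propto \frac{P(e \mid f)\, P(e \mid c)}{P(e)} \]

so the face-only and context-only emotion inferences can each come from a separate model and be fused after the fact.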
Xiao, Hanyuan; Chen, Yingshu; Huang, Huajian; Xiong, Haolin; Yang, Jing; Prasad, Pratusha; Zhao, Yajie
Localized Gaussian Splatting Editing with Contextual Awareness Miscellaneous
2024, (arXiv:2408.00083 [cs]).
@misc{xiao_localized_2024,
title = {Localized Gaussian Splatting Editing with Contextual Awareness},
author = {Hanyuan Xiao and Yingshu Chen and Huajian Huang and Haolin Xiong and Jing Yang and Pratusha Prasad and Yajie Zhao},
url = {http://arxiv.org/abs/2408.00083},
year = {2024},
date = {2024-07-01},
urldate = {2024-08-16},
publisher = {arXiv},
abstract = {Recent text-guided generation of individual 3D object has achieved great success using diffusion priors. However, these methods are not suitable for object insertion and replacement tasks as they do not consider the background, leading to illumination mismatches within the environment. To bridge the gap, we introduce an illumination-aware 3D scene editing pipeline for 3D Gaussian Splatting (3DGS) representation. Our key observation is that inpainting by the state-of-the-art conditional 2D diffusion model is consistent with background in lighting. To leverage the prior knowledge from the well-trained diffusion models for 3D object generation, our approach employs a coarse-to-fine objection optimization pipeline with inpainted views. In the first coarse step, we achieve image-to-3D lifting given an ideal inpainted view. The process employs 3D-aware diffusion prior from a view-conditioned diffusion model, which preserves illumination present in the conditioning image. To acquire an ideal inpainted image, we introduce an Anchor View Proposal (AVP) algorithm to find a single view that best represents the scene illumination in target region. In the second Texture Enhancement step, we introduce a novel Depth-guided Inpainting Score Distillation Sampling (DI-SDS), which enhances geometry and texture details with the inpainting diffusion prior, beyond the scope of the 3D-aware diffusion prior knowledge in the first coarse step. DI-SDS not only provides fine-grained texture enhancement, but also urges optimization to respect scene lighting. Our approach efficiently achieves local editing with global illumination consistency without explicitly modeling light transport. We demonstrate robustness of our method by evaluating editing in real scenes containing explicit highlight and shadows, and compare against the state-of-the-art text-to-3D editing methods.},
note = {arXiv:2408.00083 [cs]},
keywords = {DTIC, VGL},
pubstate = {published},
tppubtype = {misc}
}
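As background for the DI-SDS objective described in this abstract: standard Score Distillation Sampling (introduced in DreamFusion) optimizes 3D parameters θ rendering an image x = g(θ) with the gradient

\[ \nabla_{\theta} \mathcal{L}_{\mathrm{SDS}} = \mathbb{E}_{t,\epsilon}\left[ w(t) \left( \hat{\epsilon}_{\phi}(x_{t}; y, t) - \epsilon \right) \frac{\partial x}{\partial \theta} \right] \]

where \hat{\epsilon}_{\phi} is the diffusion model's noise prediction under condition y and x_t is the noised render. The depth-guided inpainting variant presumably swaps in an inpainting diffusion prior with depth conditioning; that reading is inferred from the abstract, not the authors' stated formulation.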
Liu, Ruying; Wu, Wanjing; Becerik-Gerber, Burcin; Lucas, Gale M.
Enhancing Building Safety Design for Active Shooter Incidents: Exploration of Building Exit Parameters using Reinforcement Learning-Based Simulations Miscellaneous
2024, (arXiv:2407.10441 [cs]).
@misc{liu_enhancing_2024,
title = {Enhancing Building Safety Design for Active Shooter Incidents: Exploration of Building Exit Parameters using Reinforcement Learning-Based Simulations},
author = {Ruying Liu and Wanjing Wu and Burcin Becerik-Gerber and Gale M. Lucas},
url = {http://arxiv.org/abs/2407.10441},
year = {2024},
date = {2024-07-01},
urldate = {2024-09-17},
publisher = {arXiv},
abstract = {With the alarming rise in active shooter incidents (ASIs) in the United States, enhancing public safety through building design has become a pressing need. This study proposes a reinforcement learning-based simulation approach addressing gaps in existing research that has neglected the dynamic behaviours of shooters. We developed an autonomous agent to simulate an active shooter within a realistic office environment, aiming to offer insights into the interactions between building design parameters and ASI outcomes. A case study is conducted to quantitatively investigate the impact of building exit numbers (total count of accessible exits) and configuration (arrangement of which exits are available or not) on evacuation and harm rates. Findings demonstrate that greater exit availability significantly improves evacuation outcomes and reduces harm. Exits nearer to the shooter's initial position hold greater importance for accessibility than those farther away. By encompassing dynamic shooter behaviours, this study offers preliminary insights into effective building safety design against evolving threats.},
note = {arXiv:2407.10441 [cs]},
keywords = {DTIC, Virtual Worlds},
pubstate = {published},
tppubtype = {misc}
}
Ke, Pei; Wen, Bosi; Feng, Andrew; Liu, Xiao; Lei, Xuanyu; Cheng, Jiale; Wang, Shengyuan; Zeng, Aohan; Dong, Yuxiao; Wang, Hongning; Tang, Jie; Huang, Minlie
CritiqueLLM: Towards an Informative Critique Generation Model for Evaluation of Large Language Model Generation Proceedings Article
In: Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 13034–13054, Association for Computational Linguistics, Bangkok, Thailand, 2024.
@inproceedings{ke_critiquellm_2024,
title = {CritiqueLLM: Towards an Informative Critique Generation Model for Evaluation of Large Language Model Generation},
author = {Pei Ke and Bosi Wen and Andrew Feng and Xiao Liu and Xuanyu Lei and Jiale Cheng and Shengyuan Wang and Aohan Zeng and Yuxiao Dong and Hongning Wang and Jie Tang and Minlie Huang},
url = {https://aclanthology.org/2024.acl-long.704},
doi = {10.18653/v1/2024.acl-long.704},
year = {2024},
date = {2024-06-01},
urldate = {2025-01-16},
booktitle = {Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
pages = {13034–13054},
publisher = {Association for Computational Linguistics},
address = {Bangkok, Thailand},
keywords = {Natural Language},
pubstate = {published},
tppubtype = {inproceedings}
}
Lu, Shuhong; Jin, Zhangyu; Rajendran, Vickram; Harari, Michal; Feng, Andrew; Melo, Celso M. De
Synthetic-to-real adaptation for complex action recognition in surveillance applications Proceedings Article
In: Manser, Kimberly E.; Melo, Celso De; Rao, Raghuveer M.; Howell, Christopher L. (Ed.): Synthetic Data for Artificial Intelligence and Machine Learning: Tools, Techniques, and Applications II, pp. 14, SPIE, National Harbor, United States, 2024, ISBN: 978-1-5106-7388-5 978-1-5106-7389-2.
@inproceedings{lu_synthetic-real_2024,
title = {Synthetic-to-real adaptation for complex action recognition in surveillance applications},
author = {Shuhong Lu and Zhangyu Jin and Vickram Rajendran and Michal Harari and Andrew Feng and Celso M. De Melo},
editor = {Kimberly E. Manser and Celso De Melo and Raghuveer M. Rao and Christopher L. Howell},
url = {https://www.spiedigitallibrary.org/conference-proceedings-of-spie/13035/3012393/Synthetic-to-real-adaptation-for-complex-action-recognition-in-surveillance/10.1117/12.3012393.full},
doi = {10.1117/12.3012393},
isbn = {978-1-5106-7388-5 978-1-5106-7389-2},
year = {2024},
date = {2024-06-01},
urldate = {2024-07-11},
booktitle = {Synthetic Data for Artificial Intelligence and Machine Learning: Tools, Techniques, and Applications II},
pages = {14},
publisher = {SPIE},
address = {National Harbor, United States},
keywords = {DTIC},
pubstate = {published},
tppubtype = {inproceedings}
}
Nurunnabi, Abdul; Teferle, Felicia; Laefer, Debra F.; Chen, Meida; Ali, Mir Masoom
Development of a Precise Tree Structure from LiDAR Point Clouds Journal Article
In: Int. Arch. Photogramm. Remote Sens. Spatial Inf. Sci., vol. XLVIII-2-2024, pp. 301–308, 2024, ISSN: 2194-9034.
@article{nurunnabi_development_2024,
title = {Development of a Precise Tree Structure from LiDAR Point Clouds},
author = {Abdul Nurunnabi and Felicia Teferle and Debra F. Laefer and Meida Chen and Mir Masoom Ali},
url = {https://isprs-archives.copernicus.org/articles/XLVIII-2-2024/301/2024/},
doi = {10.5194/isprs-archives-XLVIII-2-2024-301-2024},
issn = {2194-9034},
year = {2024},
date = {2024-06-01},
urldate = {2024-07-11},
journal = {Int. Arch. Photogramm. Remote Sens. Spatial Inf. Sci.},
volume = {XLVIII-2-2024},
pages = {301–308},
abstract = {A precise tree structure that represents the distribution of tree stem, branches, and leaves is crucial for accurately capturing the full representation of a tree. Light Detection and Ranging (LiDAR)-based three-dimensional (3D) point clouds (PCs) capture the geometry of scanned objects including forest stands and individual trees. PCs are irregular, unstructured, often noisy, and contaminated by outliers. Researchers have struggled to develop methods to separate leaves and wood without losing the tree geometry. This paper proposes a solution that employs only the spatial coordinates (x, y, z) of the PC. The new algorithm works as a filtering approach, utilizing multi-scale neighborhood-based geometric features (GFs), e.g., linearity, planarity, and verticality, to classify linear (wood) and non-linear (leaf) points. This involves finding potential wood points and coupling them with an octree-based segmentation to develop a tree architecture. The main contributions of this paper are (i) investigating the potential of different GFs to split linear and non-linear points, (ii) introducing a novel method that pointwise classifies leaf and wood points, and (iii) developing a precise 3D tree structure. The performance of the new algorithm has been demonstrated through terrestrial laser scanning PCs. For a Scots pine tree, the new method classifies leaf and wood points with an overall accuracy of 97.9%.},
keywords = {Narrative, VGL},
pubstate = {published},
tppubtype = {article}
}
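The linearity, planarity, and verticality features this abstract relies on are conventionally derived from the eigenvalues λ1 ≥ λ2 ≥ λ3 (with eigenvectors e1, e2, e3) of the covariance matrix of a point's local neighborhood; the paper's exact definitions may differ, but a common convention (e.g., Weinmann et al.) is

\[ L_{\lambda} = \frac{\lambda_{1} - \lambda_{2}}{\lambda_{1}}, \qquad P_{\lambda} = \frac{\lambda_{2} - \lambda_{3}}{\lambda_{1}}, \qquad V = 1 - \left| \langle \mathbf{e}_{3}, \mathbf{e}_{z} \rangle \right| \]

with e_z the vertical axis, so elongated stem and branch neighborhoods score high on linearity while leaf clusters do not.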
Zhang, Mingyuan; Cai, Zhongang; Pan, Liang; Hong, Fangzhou; Guo, Xinying; Yang, Lei; Liu, Ziwei
MotionDiffuse: Text-Driven Human Motion Generation With Diffusion Model Journal Article
In: IEEE Trans. Pattern Anal. Mach. Intell., vol. 46, no. 6, pp. 4115–4128, 2024, ISSN: 0162-8828, 2160-9292, 1939-3539.
@article{zhang_motiondiffuse_2024,
title = {MotionDiffuse: Text-Driven Human Motion Generation With Diffusion Model},
author = {Mingyuan Zhang and Zhongang Cai and Liang Pan and Fangzhou Hong and Xinying Guo and Lei Yang and Ziwei Liu},
url = {https://ieeexplore.ieee.org/document/10416192/},
doi = {10.1109/TPAMI.2024.3355414},
issn = {0162-8828, 2160-9292, 1939-3539},
year = {2024},
date = {2024-06-01},
urldate = {2024-07-18},
journal = {IEEE Trans. Pattern Anal. Mach. Intell.},
volume = {46},
number = {6},
pages = {4115–4128},
keywords = {VGL},
pubstate = {published},
tppubtype = {article}
}
Yin, Yinxuan; Nayyar, Mollik; Holman, Daniel; Lucas, Gale; Holbrook, Colin; Wagner, Alan
Validation and Evacuee Modeling of Virtual Robot-guided Emergency Evacuation Experiments Miscellaneous
2024.
Abstract | Links | BibTeX | Tags: DTIC, Virtual Humans
@misc{yin_validation_2024,
title = {Validation and Evacuee Modeling of Virtual Robot-guided Emergency Evacuation Experiments},
author = {Yinxuan Yin and Mollik Nayyar and Daniel Holman and Gale Lucas and Colin Holbrook and Alan Wagner},
url = {https://osf.io/mr78s},
doi = {10.31234/osf.io/mr78s},
year = {2024},
date = {2024-06-01},
urldate = {2024-09-17},
publisher = {Center for Open Science},
abstract = {Virtual Reality (VR) is an increasingly common tool for investigating human responses to emergency situations. Nonetheless, studies validating and comparing human subject behavior during real world emergencies to their responses in VR are notably rare, and no prior studies have validated whether human emergency responses to guidance from a robot are comparable in VR versus the real world. In the present pre-registered study, we used VR to replicate a previous robot-guided emergency evacuation study conducted in the real world and compared human subject behavior in matched physical and virtual environments. In both environments, human subjects were asked to follow a robot to a location and to then read an article. While reading, a fire alarm sounds. The robot then attempted to guide them to a distant, unfamiliar exit rather than nearby and familiar exits. We observed close correspondences between evacuee exit choice (the robot’s distant exit versus closer exits), evacuation time, and trust in the robot between the VR and physical environments. We further demonstrate that data collected in virtual reality can be used to create accurate motion models (mean error of 0.42 centimeters) predicting evacuee trajectories and locations in real life. Taken together, the results provide evidence for the ecological validity of VR approaches to studying human-robot interaction, particularly robot-guided emergency evacuation.},
keywords = {DTIC, Virtual Humans},
pubstate = {published},
tppubtype = {misc}
}
Saxon, Leslie; Faulk, Robert T; Boberg, Jill; Barrett, Trevor; McLelland, Steve
Continuous Assessment of Active-Duty Army Special Operations and Reconnaissance Marines Using Digital Devices and Custom Software: The Digital Comprehensive Operator Readiness Assessment (DcORA) Study Journal Article
In: J. Spec. Oper. Med., 2024, ISSN: 1553-9768.
Links | BibTeX | Tags: CBC, DTIC
@article{saxon_continuous_2024,
title = {Continuous Assessment of Active-Duty Army Special Operations and Reconnaissance Marines Using Digital Devices and Custom Software: The Digital Comprehensive Operator Readiness Assessment (DcORA) Study},
author = {Leslie Saxon and Robert T Faulk and Jill Boberg and Trevor Barrett and Steve McLelland},
url = {https://www.jsomonline.org/Citations/PXKK-I23D.php},
doi = {10.55460/PXKK-I23D},
issn = {1553-9768},
year = {2024},
date = {2024-06-01},
urldate = {2024-06-25},
journal = {J. Spec. Oper. Med.},
keywords = {CBC, DTIC},
pubstate = {published},
tppubtype = {article}
}
Greenwald, Eric; Krakowski, Ari; Hurt, Timothy; Grindstaff, Kelly; Wang, Ning
It's like I'm the AI: Youth Sensemaking About AI through Metacognitive Embodiment Proceedings Article
In: Proceedings of the 23rd Annual ACM Interaction Design and Children Conference, pp. 789–793, ACM, Delft Netherlands, 2024, ISBN: 979-8-4007-0442-0.
Links | BibTeX | Tags: AI, Machine Learning
@inproceedings{greenwald_its_2024,
title = {It's like I'm the AI: Youth Sensemaking About AI through Metacognitive Embodiment},
author = {Eric Greenwald and Ari Krakowski and Timothy Hurt and Kelly Grindstaff and Ning Wang},
url = {https://dl.acm.org/doi/10.1145/3628516.3659395},
doi = {10.1145/3628516.3659395},
isbn = {979-8-4007-0442-0},
year = {2024},
date = {2024-06-01},
urldate = {2024-06-25},
booktitle = {Proceedings of the 23rd Annual ACM Interaction Design and Children Conference},
pages = {789–793},
publisher = {ACM},
address = {Delft Netherlands},
keywords = {AI, Machine Learning},
pubstate = {published},
tppubtype = {inproceedings}
}
Chen, Meida; Lal, Devashish; Yu, Zifan; Xu, Jiuyi; Feng, Andrew; You, Suya; Nurunnabi, Abdul; Shi, Yangming
Large-Scale 3D Terrain Reconstruction Using 3D Gaussian Splatting for Visualization and Simulation Journal Article
In: Int. Arch. Photogramm. Remote Sens. Spatial Inf. Sci., vol. XLVIII-2-2024, pp. 49–54, 2024, ISSN: 2194-9034.
Abstract | Links | BibTeX | Tags: DTIC, Graphics, VGL
@article{chen_large-scale_2024,
title = {Large-Scale 3D Terrain Reconstruction Using 3D Gaussian Splatting for Visualization and Simulation},
author = {Meida Chen and Devashish Lal and Zifan Yu and Jiuyi Xu and Andrew Feng and Suya You and Abdul Nurunnabi and Yangming Shi},
url = {https://isprs-archives.copernicus.org/articles/XLVIII-2-2024/49/2024/},
doi = {10.5194/isprs-archives-XLVIII-2-2024-49-2024},
issn = {2194-9034},
year = {2024},
date = {2024-06-01},
urldate = {2024-06-20},
journal = {Int. Arch. Photogramm. Remote Sens. Spatial Inf. Sci.},
volume = {XLVIII-2-2024},
pages = {49–54},
abstract = {The fusion of low-cost unmanned aerial systems (UAS) with advanced photogrammetric techniques has revolutionized 3D terrain reconstruction, enabling the automated creation of detailed models. Concurrently, the advent of 3D Gaussian Splatting has introduced a paradigm shift in 3D data representation, offering visually realistic renditions distinct from traditional polygon-based models. Our research builds upon this foundation, aiming to integrate Gaussian Splatting into interactive simulations for immersive virtual environments. We address challenges such as collision detection by adopting a hybrid approach, combining Gaussian Splatting with photogrammetry-derived meshes. Through comprehensive experimentation covering varying terrain sizes and Gaussian densities, we evaluate scalability, performance, and limitations. Our findings contribute to advancing the use of advanced computer graphics techniques for enhanced 3D terrain visualization and simulation.},
keywords = {DTIC, Graphics, VGL},
pubstate = {published},
tppubtype = {article}
}
Nye, Benjamin D.; Core, Mark G.; Chereddy, Sai V. R.; Young, Vivian; Auerbach, Daniel
Bootstrapping Assessments for Team Simulations: Transfer Learning Between First-Person-Shooter Game Maps Book Section
In: Sottilare, Robert A.; Schwarz, Jessica (Ed.): Adaptive Instructional Systems, vol. 14727, pp. 261–271, Springer Nature Switzerland, Cham, 2024, ISBN: 978-3-031-60608-3 978-3-031-60609-0, (Series Title: Lecture Notes in Computer Science).
Links | BibTeX | Tags: DTIC, Learning Sciences, Machine Learning, UARC
@incollection{sottilare_bootstrapping_2024,
title = {Bootstrapping Assessments for Team Simulations: Transfer Learning Between First-Person-Shooter Game Maps},
author = {Benjamin D. Nye and Mark G. Core and Sai V. R. Chereddy and Vivian Young and Daniel Auerbach},
editor = {Robert A. Sottilare and Jessica Schwarz},
url = {https://link.springer.com/10.1007/978-3-031-60609-0_19},
doi = {10.1007/978-3-031-60609-0_19},
isbn = {978-3-031-60608-3 978-3-031-60609-0},
year = {2024},
date = {2024-06-01},
urldate = {2024-06-18},
booktitle = {Adaptive Instructional Systems},
volume = {14727},
pages = {261–271},
publisher = {Springer Nature Switzerland},
address = {Cham},
note = {Series Title: Lecture Notes in Computer Science},
keywords = {DTIC, Learning Sciences, Machine Learning, UARC},
pubstate = {published},
tppubtype = {incollection}
}
Core, Mark G.; Nye, Benjamin D.; Fegley, Brent D.
Trend-Aware Scenario Authoring: Adapting Training Toward Patterns from Real Operations Book Section
In: Sottilare, Robert A.; Schwarz, Jessica (Ed.): Adaptive Instructional Systems, vol. 14727, pp. 15–24, Springer Nature Switzerland, Cham, 2024, ISBN: 978-3-031-60608-3 978-3-031-60609-0, (Series Title: Lecture Notes in Computer Science).
Links | BibTeX | Tags: DTIC, Learning Sciences, UARC
@incollection{sottilare_trend-aware_2024,
title = {Trend-Aware Scenario Authoring: Adapting Training Toward Patterns from Real Operations},
author = {Mark G. Core and Benjamin D. Nye and Brent D. Fegley},
editor = {Robert A. Sottilare and Jessica Schwarz},
url = {https://link.springer.com/10.1007/978-3-031-60609-0_2},
doi = {10.1007/978-3-031-60609-0_2},
isbn = {978-3-031-60608-3 978-3-031-60609-0},
year = {2024},
date = {2024-06-01},
urldate = {2024-06-18},
booktitle = {Adaptive Instructional Systems},
volume = {14727},
pages = {15–24},
publisher = {Springer Nature Switzerland},
address = {Cham},
note = {Series Title: Lecture Notes in Computer Science},
keywords = {DTIC, Learning Sciences, UARC},
pubstate = {published},
tppubtype = {incollection}
}
Bohy, Hugo; Tran, Minh; Haddad, Kevin El; Dutoit, Thierry; Soleymani, Mohammad
Social-MAE: A Transformer-Based Multimodal Autoencoder for Face and Voice Proceedings Article
In: 2024 IEEE 18th International Conference on Automatic Face and Gesture Recognition (FG), pp. 1–5, IEEE, Istanbul, Turkiye, 2024, ISBN: 979-8-3503-9494-8.
@inproceedings{bohy_social-mae_2024,
title = {Social-MAE: A Transformer-Based Multimodal Autoencoder for Face and Voice},
author = {Hugo Bohy and Minh Tran and Kevin El Haddad and Thierry Dutoit and Mohammad Soleymani},
url = {https://ieeexplore.ieee.org/document/10581940/},
doi = {10.1109/FG59268.2024.10581940},
isbn = {979-8-3503-9494-8},
year = {2024},
date = {2024-05-01},
urldate = {2024-07-18},
booktitle = {2024 IEEE 18th International Conference on Automatic Face and Gesture Recognition (FG)},
pages = {1–5},
publisher = {IEEE},
address = {Istanbul, Turkiye},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Liu, Rong; Xu, Rui; Hu, Yue; Chen, Meida; Feng, Andrew
AtomGS: Atomizing Gaussian Splatting for High-Fidelity Radiance Field Miscellaneous
2024, (Version Number: 2).
Abstract | Links | BibTeX | Tags: Graphics, VGL
@misc{liu_atomgs_2024,
title = {AtomGS: Atomizing Gaussian Splatting for High-Fidelity Radiance Field},
author = {Rong Liu and Rui Xu and Yue Hu and Meida Chen and Andrew Feng},
url = {https://arxiv.org/abs/2405.12369},
doi = {10.48550/ARXIV.2405.12369},
year = {2024},
date = {2024-05-01},
urldate = {2024-07-11},
publisher = {arXiv},
abstract = {3D Gaussian Splatting (3DGS) has recently advanced radiance field reconstruction by offering superior capabilities for novel view synthesis and real-time rendering speed. However, its strategy of blending optimization and adaptive density control might lead to sub-optimal results; it can sometimes yield noisy geometry and blurry artifacts due to prioritizing optimizing large Gaussians at the cost of adequately densifying smaller ones. To address this, we introduce AtomGS, consisting of Atomized Proliferation and Geometry-Guided Optimization. The Atomized Proliferation constrains ellipsoid Gaussians of various sizes into more uniform-sized Atom Gaussians. The strategy enhances the representation of areas with fine features by placing greater emphasis on densification in accordance with scene details. In addition, we proposed a Geometry-Guided Optimization approach that incorporates an Edge-Aware Normal Loss. This optimization method effectively smooths flat surfaces while preserving intricate details. Our evaluation shows that AtomGS outperforms existing state-of-the-art methods in rendering quality. Additionally, it achieves competitive accuracy in geometry reconstruction and offers a significant improvement in training speed over other SDF-based methods. More interactive demos can be found in our website (https://rongliu-leo.github.io/AtomGS/).},
note = {Version Number: 2},
keywords = {Graphics, VGL},
pubstate = {published},
tppubtype = {misc}
}
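For intuition only, here is a minimal PyTorch sketch of an edge-aware normal loss of the general kind the AtomGS abstract names: neighbouring normals are smoothed except across image edges, where an RGB-gradient weight relaxes the penalty. The exact AtomGS formulation may differ; every name and weighting here is an assumption.

import torch

def edge_aware_normal_loss(normals, rgb):
    """normals, rgb: (C, H, W) rendered normal map and RGB image."""
    dn_x = normals.diff(dim=2).abs().mean(0)         # normal change along x
    dn_y = normals.diff(dim=1).abs().mean(0)         # normal change along y
    w_x = torch.exp(-rgb.diff(dim=2).abs().mean(0))  # small weight at edges
    w_y = torch.exp(-rgb.diff(dim=1).abs().mean(0))
    return (w_x * dn_x).mean() + (w_y * dn_y).mean()

A term of this shape flattens surfaces where the image is smooth while leaving genuine detail at edges untouched, which matches the behavior the abstract claims.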
Chang, Di; Shi, Yichun; Gao, Quankai; Fu, Jessica; Xu, Hongyi; Song, Guoxian; Yan, Qing; Zhu, Yizhe; Yang, Xiao; Soleymani, Mohammad
MagicPose: Realistic Human Poses and Facial Expressions Retargeting with Identity-aware Diffusion Miscellaneous
2024, (arXiv:2311.12052 [cs]).
Abstract | Links | BibTeX | Tags:
@misc{chang_magicpose_2024,
title = {MagicPose: Realistic Human Poses and Facial Expressions Retargeting with Identity-aware Diffusion},
author = {Di Chang and Yichun Shi and Quankai Gao and Jessica Fu and Hongyi Xu and Guoxian Song and Qing Yan and Yizhe Zhu and Xiao Yang and Mohammad Soleymani},
url = {http://arxiv.org/abs/2311.12052},
year = {2024},
date = {2024-05-01},
urldate = {2024-07-18},
publisher = {arXiv},
abstract = {In this work, we propose MagicPose, a diffusion-based model for 2D human pose and facial expression retargeting. Specifically, given a reference image, we aim to generate a person's new images by controlling the poses and facial expressions while keeping the identity unchanged. To this end, we propose a two-stage training strategy to disentangle human motions and appearance (e.g., facial expressions, skin tone and dressing), consisting of (1) the pre-training of an appearance-control block and (2) learning appearance-disentangled pose control. Our novel design enables robust appearance control over generated human images, including body, facial attributes, and even background. By leveraging the prior knowledge of image diffusion models, MagicPose generalizes well to unseen human identities and complex poses without the need for additional fine-tuning. Moreover, the proposed model is easy to use and can be considered as a plug-in module/extension to Stable Diffusion. The code is available at: https://github.com/Boese0601/MagicDance},
note = {arXiv:2311.12052 [cs]},
keywords = {},
pubstate = {published},
tppubtype = {misc}
}
Koresh, Caleb; Ustun, Volkan; Kumar, Rajay; Aris, Tim
Improving Reinforcement Learning Experiments in Unity through Waypoint Utilization Journal Article
In: FLAIRS, vol. 37, 2024, ISSN: 2334-0762.
Abstract | Links | BibTeX | Tags: Machine Learning
@article{koresh_improving_2024,
title = {Improving Reinforcement Learning Experiments in Unity through Waypoint Utilization},
author = {Caleb Koresh and Volkan Ustun and Rajay Kumar and Tim Aris},
url = {https://journals.flvc.org/FLAIRS/article/view/135571},
doi = {10.32473/flairs.37.1.135571},
issn = {2334-0762},
year = {2024},
date = {2024-05-01},
urldate = {2024-08-13},
journal = {FLAIRS},
volume = {37},
abstract = {Multi-agent Reinforcement Learning (MARL) models teams of agents that learn by dynamically interacting with an environment and each other, presenting opportunities to train adaptive models for team-based scenarios. However, MARL algorithms pose substantial challenges due to their immense computational requirements. This paper introduces an automatically generated waypoint-based movement system to abstract and simplify complex environments in Unity while allowing agents to learn strategic cooperation. To demonstrate the effectiveness of our approach, we utilized a simple scenario with heterogeneous roles in each team. We trained this scenario on variations of realistic terrains and compared learning between fine-grained (almost) continuous and waypoint-based movement systems. Our results indicate efficiency in learning and improved performance with waypoint-based navigation. Furthermore, our results show that waypoint-based movement systems can effectively learn differentiated behavior policies for heterogeneous roles in these experiments. These early exploratory results point out the potential of waypoint-based navigation for reducing the computational costs of developing and training MARL models in complex environments. The complete project with all scenarios and results is available on GitHub: https://github.com/HATS-ICT/ml-agents-dodgeball-env-ICT.},
keywords = {Machine Learning},
pubstate = {published},
tppubtype = {article}
}
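As a rough sketch of the waypoint abstraction described in the abstract (names and thresholds are illustrative, not the project's ML-Agents code), a graph is generated by linking nearby waypoints, and each agent's discrete action then selects a neighbouring waypoint rather than a fine-grained motion:

import math

def build_waypoint_graph(waypoints, max_edge_len):
    """waypoints: list of (x, y, z) positions; link pairs within range."""
    graph = {i: [] for i in range(len(waypoints))}
    for i, p in enumerate(waypoints):
        for j in range(i + 1, len(waypoints)):
            if math.dist(p, waypoints[j]) <= max_edge_len:
                graph[i].append(j)
                graph[j].append(i)
    return graph

def move(graph, node, action):
    """A discrete RL action indexes into the current node's neighbours."""
    neighbours = graph[node]
    return neighbours[action % len(neighbours)] if neighbours else node

Collapsing movement to graph hops shrinks both the action space and the effective episode length, which is the source of the computational savings the paper reports.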
Aris, Timothy; Ustun, Volkan; Kumar, Rajay
Training Reinforcement Learning Agents to React to an Ambush for Military Simulations Journal Article
In: FLAIRS, vol. 37, 2024, ISSN: 2334-0762.
Abstract | Links | BibTeX | Tags: Simulation, VR
@article{aris_training_2024,
title = {Training Reinforcement Learning Agents to React to an Ambush for Military Simulations},
author = {Timothy Aris and Volkan Ustun and Rajay Kumar},
url = {https://journals.flvc.org/FLAIRS/article/view/135578},
doi = {10.32473/flairs.37.1.135578},
issn = {2334-0762},
year = {2024},
date = {2024-05-01},
urldate = {2024-08-13},
journal = {FLAIRS},
volume = {37},
abstract = {There is a need for realistic Opposing Forces (OPFOR) behavior in military training simulations. Current training simulations generally only have simple, non-adaptive behaviors, requiring human instructors to play the role of OPFOR in any complicated scenario. This poster addresses this need by focusing on a specific scenario: training reinforcement learning agents to react to an ambush. It proposes a novel way to check for occlusion algorithmically. It shows vector fields showing the agent’s actions through the course of a training run. It shows that a single agent switching between multiple goals is possible, at least in a simplified environment. Such an approach could reduce the need to develop different agents for different scenarios. Finally, it shows a competent agent trained on a simplified React to Ambush scenario, demonstrating the plausibility of a scaled-up version.},
keywords = {Simulation, VR},
pubstate = {published},
tppubtype = {article}
}
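The poster's algorithmic occlusion check is not spelled out in the abstract; a common way to implement one, sketched below under that assumption, is a line-of-sight test against axis-aligned blockers (a pure-Python stand-in for an engine raycast):

def ray_hits_aabb(origin, target, box_min, box_max):
    """Slab test: does the segment origin->target cross the box?"""
    t_near, t_far = 0.0, 1.0
    for axis in range(3):
        d = target[axis] - origin[axis]
        if abs(d) < 1e-9:                      # segment parallel to this slab
            if not box_min[axis] <= origin[axis] <= box_max[axis]:
                return False
            continue
        t1 = (box_min[axis] - origin[axis]) / d
        t2 = (box_max[axis] - origin[axis]) / d
        t_near = max(t_near, min(t1, t2))
        t_far = min(t_far, max(t1, t2))
        if t_near > t_far:
            return False
    return True

def is_occluded(agent_pos, threat_pos, blockers):
    """blockers: iterable of (box_min, box_max) obstacle bounds."""
    return any(ray_hits_aabb(agent_pos, threat_pos, lo, hi)
               for lo, hi in blockers)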
Liu, Lixing; Ustun, Volkan; Kumar, Rajay
Leveraging Organizational Hierarchy to Simplify Reward Design in Cooperative Multi-agent Reinforcement Learning Journal Article
In: FLAIRS, vol. 37, 2024, ISSN: 2334-0762.
Abstract | Links | BibTeX | Tags: Machine Learning
@article{liu_leveraging_2024,
title = {Leveraging Organizational Hierarchy to Simplify Reward Design in Cooperative Multi-agent Reinforcement Learning},
author = {Lixing Liu and Volkan Ustun and Rajay Kumar},
url = {https://journals.flvc.org/FLAIRS/article/view/135588},
doi = {10.32473/flairs.37.1.135588},
issn = {2334-0762},
year = {2024},
date = {2024-05-01},
urldate = {2024-08-13},
journal = {FLAIRS},
volume = {37},
abstract = {The effectiveness of multi-agent reinforcement learning (MARL) hinges largely on the meticulous arrangement of objectives. Yet, conventional MARL methods might not completely harness the inherent structures present in environmental states and agent relationships for goal organization. This study is conducted within the domain of military training simulations, which are typically characterized by complex, heterogeneous, non-stationary, and doctrine-driven environments with a clear organizational hierarchy and a top-down chain of command. This research investigates the approximation and integration of the organizational hierarchy into MARL for cooperative training scenarios, with the goal of streamlining the processes of reward engineering and enhancing team coordination. In the preliminary experiments, we employed two-tiered commander-subordinate feudal hierarchical (CSFH) networks to separate the prioritized team goal and individual goals. The empirical results demonstrate that the proposed framework enhances learning efficiency. It guarantees the learning of a prioritized policy for the commander agent and encourages subordinate agents to explore areas of interest more frequently, guided by appropriate soft constraints imposed by the commander.},
keywords = {Machine Learning},
pubstate = {published},
tppubtype = {article}
}
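A minimal sketch of the two-tier reward split the abstract describes, under our assumption (not the paper's stated form) that the commander is rewarded only on the prioritized team goal while subordinates mix individual rewards with a commander-issued soft constraint:

def commander_reward(team_goal_progress):
    """Commander optimizes the prioritized team objective only."""
    return team_goal_progress

def subordinate_reward(individual_reward, constraint_violation, beta=0.1):
    """beta weights the commander's soft constraint (assumed penalty form)."""
    return individual_reward - beta * constraint_violation

Separating the tiers this way spares the designer from hand-balancing a single monolithic team reward, which is the reward-engineering simplification the study targets.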
Lukin, Stephanie M; Bonial, Claire; Marge, Matthew; Hudson, Taylor; Hayes, Cory J.; Pollard, Kimberly; Baker, Anthony L.; Foots, Ashley; Artstein, Ron; Gervits, Felix; Abrams, Mitchell; Cassidy, Henry; Donatelli, Lucia; Leuski, Anton; Hill, Susan G.; Traum, David; Voss, Clare
SCOUT: A Situated and Multi-Modal Human-Robot Dialogue Corpus Journal Article
In: pp. 14445–14458, 2024.
Abstract | Links | BibTeX | Tags:
@article{lukin-etal-2024-scout-situated,
title = {SCOUT: A Situated and Multi-Modal Human-Robot Dialogue Corpus},
author = {Stephanie M Lukin and Claire Bonial and Matthew Marge and Taylor Hudson and Cory J. Hayes and Kimberly Pollard and Anthony L. Baker and Ashley Foots and Ron Artstein and Felix Gervits and Mitchell Abrams and Henry Cassidy and Lucia Donatelli and Anton Leuski and Susan G. Hill and David Traum and Clare Voss},
url = {https://aclanthology.org/2024.lrec-main.1259},
year = {2024},
date = {2024-05-01},
pages = {14445–14458},
abstract = {We introduce the Situated Corpus Of Understanding Transactions (SCOUT), a multi-modal collection of human-robot dialogue in the task domain of collaborative exploration. The corpus was constructed from multiple Wizard-of-Oz experiments where human participants gave verbal instructions to a remotely-located robot to move and gather information about its surroundings. SCOUT contains 89,056 utterances and 310,095 words from 278 dialogues averaging 320 utterances per dialogue. The dialogues are aligned with the multi-modal data streams available during the experiments: 5,785 images and 30 maps. The corpus has been annotated with Abstract Meaning Representation and Dialogue-AMR to identify the speaker’s intent and meaning within an utterance, and with Transactional Units and Relations to track relationships between utterances to reveal patterns of the Dialogue Structure. We describe how the corpus and its annotations have been used to develop autonomous human-robot systems and enable research in open questions of how humans speak to robots. We release this corpus to accelerate progress in autonomous, situated, human-robot dialogue, especially in the context of navigation tasks where details about the environment need to be discovered.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
West, Taylor Nicole; Prinzing, Michael; Garton, Catherine; Berman, Catherine J.; Zhou, Jieni; Hale, James; Gratch, Jonathan; Fredrickson, Barbara
Improving Social Connection with Weak Ties and Strangers: Effects of a New Micro-Intervention on Interaction Quality and Social Behavior Miscellaneous
2024.
Abstract | Links | BibTeX | Tags: Emotions, Virtual Humans
@misc{west_improving_2024,
title = {Improving Social Connection with Weak Ties and Strangers: Effects of a New Micro-Intervention on Interaction Quality and Social Behavior},
author = {Taylor Nicole West and Michael Prinzing and Catherine Garton and Catherine J. Berman and Jieni Zhou and James Hale and Jonathan Gratch and Barbara Fredrickson},
url = {https://osf.io/ytjr6},
doi = {10.31234/osf.io/ytjr6},
year = {2024},
date = {2024-05-01},
urldate = {2024-06-25},
abstract = {We propose that the emotional quality of people’s interactions with acquaintances (i.e., weak ties) and strangers contributes to well-being. We test whether a new micro-intervention can raise the quality of these interactions. We randomized young adults (N = 335) to this connectedness micro-intervention or a control intervention. Both interventions were delivered via a psychoeducational video followed by a brief conversation with a virtual human, with whom participants developed if-then plans to carry out their assigned behavioral goal. Pre-intervention, high-quality weak-tie and stranger interactions were associated with lower loneliness and greater mental health independent of strong-tie interaction quality. Experimental data showed the connectedness intervention improved the emotional quality of participants' interactions with weak ties and strangers over two days, evident in participants’ episodic self-reports and faster in-lab conversational response time. Discussion centers on implications for developing scalable behavioral interventions to improve well-being.},
keywords = {Emotions, Virtual Humans},
pubstate = {published},
tppubtype = {misc}
}
Zhang, Hao; Chang, Di; Li, Fang; Soleymani, Mohammad; Ahuja, Narendra
MagicPose4D: Crafting Articulated Models with Appearance and Motion Control Miscellaneous
2024, (Version Number: 1).
Abstract | Links | BibTeX | Tags: VGL, Virtual Humans
@misc{zhang_magicpose4d_2024,
title = {MagicPose4D: Crafting Articulated Models with Appearance and Motion Control},
author = {Hao Zhang and Di Chang and Fang Li and Mohammad Soleymani and Narendra Ahuja},
url = {https://arxiv.org/abs/2405.14017},
doi = {10.48550/ARXIV.2405.14017},
year = {2024},
date = {2024-05-01},
urldate = {2024-06-25},
publisher = {arXiv},
abstract = {With the success of 2D and 3D visual generative models, there is growing interest in generating 4D content. Existing methods primarily rely on text prompts to produce 4D content, but they often fall short of accurately defining complex or rare motions. To address this limitation, we propose MagicPose4D, a novel framework for refined control over both appearance and motion in 4D generation. Unlike traditional methods, MagicPose4D accepts monocular videos as motion prompts, enabling precise and customizable motion generation. MagicPose4D comprises two key modules: i) the Dual-Phase 4D Reconstruction Module, which operates in two phases. The first phase focuses on capturing the model's shape using accurate 2D supervision and less accurate but geometrically informative 3D pseudo-supervision, without imposing skeleton constraints. The second phase refines the model using more accurate pseudo-3D supervision obtained in the first phase and introduces kinematic chain-based skeleton constraints to ensure physical plausibility. Additionally, we propose a Global-local Chamfer loss that aligns the overall distribution of predicted mesh vertices with the supervision while maintaining part-level alignment without extra annotations. ii) The Cross-category Motion Transfer Module leverages the predictions from the 4D reconstruction module and uses a kinematic-chain-based skeleton to achieve cross-category motion transfer. It ensures smooth transitions between frames through dynamic rigidity, facilitating robust generalization without additional training. Through extensive experiments, we demonstrate that MagicPose4D significantly improves the accuracy and consistency of 4D content generation, outperforming existing methods in various benchmarks.},
note = {Version Number: 1},
keywords = {VGL, Virtual Humans},
pubstate = {published},
tppubtype = {misc}
}
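For the Global-local Chamfer loss named above, a hedged PyTorch sketch follows: a global Chamfer term over all vertices plus per-part terms for part-level alignment. The part partitioning, weighting, and shapes are assumptions, not the paper's code.

import torch

def chamfer(a, b):
    """Symmetric Chamfer distance between point sets a: (N, 3), b: (M, 3)."""
    d = torch.cdist(a, b)                       # (N, M) pairwise distances
    return d.min(dim=1).values.mean() + d.min(dim=0).values.mean()

def global_local_chamfer(pred, target, part_ids, local_weight=0.5):
    """part_ids assigns each vertex (same indexing in both sets) to a part."""
    loss = chamfer(pred, target)                # global distribution alignment
    for p in part_ids.unique():                 # add part-level alignment
        loss = loss + local_weight * chamfer(pred[part_ids == p],
                                             target[part_ids == p])
    return loss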
Jones, Brennan; Xu, Yan; Li, Qisheng; Scherer, Stefan
Designing a Proactive Context-Aware AI Chatbot for People's Long-Term Goals Proceedings Article
In: Extended Abstracts of the CHI Conference on Human Factors in Computing Systems, pp. 1–7, ACM, Honolulu HI USA, 2024, ISBN: 979-8-4007-0331-7.
Links | BibTeX | Tags: AI, Simulation
@inproceedings{jones_designing_2024,
title = {Designing a Proactive Context-Aware AI Chatbot for People's Long-Term Goals},
author = {Brennan Jones and Yan Xu and Qisheng Li and Stefan Scherer},
url = {https://dl.acm.org/doi/10.1145/3613905.3650912},
doi = {10.1145/3613905.3650912},
isbn = {979-8-4007-0331-7},
year = {2024},
date = {2024-05-01},
urldate = {2024-06-25},
booktitle = {Extended Abstracts of the CHI Conference on Human Factors in Computing Systems},
pages = {1–7},
publisher = {ACM},
address = {Honolulu HI USA},
keywords = {AI, Simulation},
pubstate = {published},
tppubtype = {inproceedings}
}
Chemburkar, Ankur; Gordon, Andrew; Feng, Andrew
Evaluating Vision-Language Models on the TriangleCOPA Benchmark Journal Article
In: FLAIRS-37, vol. 37, 2024.
Abstract | BibTeX | Tags: DTIC, Narrative
@article{chemburkar_evaluating_2024,
title = {Evaluating Vision-Language Models on the TriangleCOPA Benchmark},
author = {Ankur Chemburkar and Andrew Gordon and Andrew Feng},
year = {2024},
date = {2024-05-01},
journal = {FLAIRS-37},
volume = {37},
abstract = {The TriangleCOPA benchmark consists of 100 textual questions with videos depicting the movements of simple shapes in the style of the classic social-psychology film created by Fritz Heider and Marianne Simmel in 1944. In our experiments, we investigate the performance of current vision-language models on this challenging benchmark, assessing the capability of these models for visual anthropomorphism and abstract interpretation.},
keywords = {DTIC, Narrative},
pubstate = {published},
tppubtype = {article}
}
Mozgai, Sharon A; Kaurloto, Cari; Winn, Jade G; Leeds, Andrew; Beland, Sarah; Sookiassian, Arman; Hartholt, Arno
Accelerating Scoping Reviews: A Case Study in the User-Centered Design of an AI-Enabled Interdisciplinary Research Tool Proceedings Article
In: Extended Abstracts of the CHI Conference on Human Factors in Computing Systems, pp. 1–8, ACM, Honolulu HI USA, 2024, ISBN: 979-8-4007-0331-7.
Links | BibTeX | Tags: AI, DTIC, UARC, Virtual Humans
@inproceedings{mozgai_accelerating_2024,
title = {Accelerating Scoping Reviews: A Case Study in the User-Centered Design of an AI-Enabled Interdisciplinary Research Tool},
author = {Sharon A Mozgai and Cari Kaurloto and Jade G Winn and Andrew Leeds and Sarah Beland and Arman Sookiassian and Arno Hartholt},
url = {https://dl.acm.org/doi/10.1145/3613905.3637110},
doi = {10.1145/3613905.3637110},
isbn = {979-8-4007-0331-7},
year = {2024},
date = {2024-05-01},
urldate = {2024-06-18},
booktitle = {Extended Abstracts of the CHI Conference on Human Factors in Computing Systems},
pages = {1–8},
publisher = {ACM},
address = {Honolulu HI USA},
keywords = {AI, DTIC, UARC, Virtual Humans},
pubstate = {published},
tppubtype = {inproceedings}
}
Murawski, Alaine; Ramirez‐Zohfeld, Vanessa; Mell, Johnathan; Tschoe, Marianne; Schierer, Allison; Olvera, Charles; Brett, Jeanne; Gratch, Jonathan; Lindquist, Lee A.
NegotiAge: Development and pilot testing of an artificial intelligence‐based family caregiver negotiation program Journal Article
In: J American Geriatrics Society, vol. 72, no. 4, pp. 1112–1121, 2024, ISSN: 0002-8614, 1532-5415.
Abstract | Links | BibTeX | Tags:
@article{murawski_span_2024,
title = {NegotiAge: Development and pilot testing of an artificial intelligence‐based family caregiver negotiation program},
author = {Alaine Murawski and Vanessa Ramirez‐Zohfeld and Johnathan Mell and Marianne Tschoe and Allison Schierer and Charles Olvera and Jeanne Brett and Jonathan Gratch and Lee A. Lindquist},
url = {https://agsjournals.onlinelibrary.wiley.com/doi/10.1111/jgs.18775},
doi = {10.1111/jgs.18775},
issn = {0002-8614, 1532-5415},
year = {2024},
date = {2024-04-01},
urldate = {2024-12-05},
journal = {J American Geriatrics Society},
volume = {72},
number = {4},
pages = {1112–1121},
abstract = {Background: Family caregivers of people with Alzheimer's disease experience conflicts as they navigate health care but lack training to resolve these disputes. We sought to develop and pilot test an artificial‐intelligence negotiation training program, NegotiAge, for family caregivers. Methods: We convened negotiation experts, a geriatrician, a social worker, and community‐based family caregivers. Content matter experts created short videos to teach negotiation skills. Caregivers generated dialogue surrounding conflicts. Computer scientists utilized the dialogue with the Interactive Arbitration Guide Online (IAGO) platform to develop avatar‐based agents (e.g., sibling, older adult, physician) for caregivers to practice negotiating. Pilot testing was conducted with family caregivers to assess usability (USE) and satisfaction (open‐ended questions with thematic analysis). Results: Development: With NegotiAge, caregivers progress through didactic material, then receive scenarios to negotiate (e.g., physician recommends gastric tube, sibling disagrees with home support, older adult refusing support). Caregivers negotiate in real‐time with avatars who are designed to act like humans, including emotional tactics and irrational behaviors. Caregivers send/receive offers, using tactics until either mutual agreement or time expires. Immediate feedback is generated for the user to improve skills training. Pilot testing: Family caregivers (n = 12) completed the program and survey. USE questionnaire (Likert scale 1–7) subset scores revealed: (1) Useful—Mean 5.69 (SD 0.76); (2) Ease—Mean 5.24 (SD 0.96); (3) Learn—Mean 5.69 (SD 0.74); (4) Satisfy—Mean 5.62 (SD 1.10). Items that received over 80% agreement were: It helps me be more effective; It helps me be more productive; It is useful; It gives me more control over the activities in my life; It makes the things I want to accomplish easier to get done. Participants were highly satisfied and found NegotiAge fun to use (91.7%), with 100% who would recommend it to a friend. Conclusion: NegotiAge is an Artificial‐Intelligent Caregiver Negotiation Program that is usable and feasible for family caregivers to become familiar with negotiating conflicts commonly seen in health care.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Ehsanpour, Mahsa; Reid, Ian; Rezatofighi, Hamid
Social-MAE: Social Masked Autoencoder for Multi-person Motion Representation Learning Miscellaneous
2024, (Version Number: 1).
Abstract | Links | BibTeX | Tags: Social Simulation
@misc{ehsanpour_social-mae_2024,
title = {Social-MAE: Social Masked Autoencoder for Multi-person Motion Representation Learning},
author = {Mahsa Ehsanpour and Ian Reid and Hamid Rezatofighi},
url = {https://arxiv.org/abs/2404.05578},
doi = {10.48550/ARXIV.2404.05578},
year = {2024},
date = {2024-04-01},
urldate = {2024-07-12},
publisher = {arXiv},
abstract = {For a complete comprehension of multi-person scenes, it is essential to go beyond basic tasks like detection and tracking. Higher-level tasks, such as understanding the interactions and social activities among individuals, are also crucial. Progress towards models that can fully understand scenes involving multiple people is hindered by a lack of sufficient annotated data for such high-level tasks. To address this challenge, we introduce Social-MAE, a simple yet effective transformer-based masked autoencoder framework for multi-person human motion data. The framework uses masked modeling to pre-train the encoder to reconstruct masked human joint trajectories, enabling it to learn generalizable and data efficient representations of motion in human crowded scenes. Social-MAE comprises a transformer as the MAE encoder and a lighter-weight transformer as the MAE decoder which operates on multi-person joints' trajectory in the frequency domain. After the reconstruction task, the MAE decoder is replaced with a task-specific decoder and the model is fine-tuned end-to-end for a variety of high-level social tasks. Our proposed model combined with our pre-training approach achieves the state-of-the-art results on various high-level social tasks, including multi-person pose forecasting, social grouping, and social action understanding. These improvements are demonstrated across four popular multi-person datasets encompassing both human 2D and 3D body pose.},
note = {Version Number: 1},
keywords = {Social Simulation},
pubstate = {published},
tppubtype = {misc}
}
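As a rough illustration of the pre-training recipe in the abstract (shapes, the DCT as the frequency transform, and the masking ratio are our assumptions, not the paper's code), trajectories are tokenized in the frequency domain and a random subset is hidden for the encoder to reconstruct:

import numpy as np
from scipy.fft import dct

def mask_motion_tokens(joints, mask_ratio=0.75, seed=0):
    """joints: (people, frames, joints, 3) multi-person motion array."""
    rng = np.random.default_rng(seed)
    freq = dct(joints, axis=1, norm="ortho")     # frequency-domain trajectories
    tokens = freq.reshape(-1, freq.shape[-1])    # one token per (person, freq, joint)
    n_mask = int(mask_ratio * len(tokens))
    masked = rng.choice(len(tokens), n_mask, replace=False)
    visible = np.delete(tokens, masked, axis=0)  # encoder sees only these
    return visible, tokens[masked], masked       # decoder reconstructs the rest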
Soleymani, Mohammad; Kumano, Shiro; Provost, Emily Mower; Bianchi-Berthouze, Nadia; Sano, Akane; Suzuki, Kenji
Guest Editorial Best of ACII 2021 Journal Article
In: IEEE Trans. Affective Comput., vol. 15, no. 2, pp. 376–379, 2024, ISSN: 1949-3045, 2371-9850.
@article{soleymani_guest_2024,
title = {Guest Editorial Best of ACII 2021},
author = {Mohammad Soleymani and Shiro Kumano and Emily Mower Provost and Nadia Bianchi-Berthouze and Akane Sano and Kenji Suzuki},
url = {https://ieeexplore.ieee.org/document/10542496/},
doi = {10.1109/TAFFC.2024.3389249},
issn = {1949-3045, 2371-9850},
year = {2024},
date = {2024-04-01},
urldate = {2024-06-25},
journal = {IEEE Trans. Affective Comput.},
volume = {15},
number = {2},
pages = {376–379},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Zhang, Hui; Kuang, Bingran; Zhao, Yajie
Camera Calibration using a Single View of a Symmetric Object Proceedings Article
In: ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 2705–2709, IEEE, Seoul, Korea, Republic of, 2024, ISBN: 979-8-3503-4485-1.
Links | BibTeX | Tags: Graphics, VGL
@inproceedings{zhang_camera_2024,
title = {Camera Calibration using a Single View of a Symmetric Object},
author = {Hui Zhang and Bingran Kuang and Yajie Zhao},
url = {https://ieeexplore.ieee.org/document/10446005/},
doi = {10.1109/ICASSP48485.2024.10446005},
isbn = {979-8-3503-4485-1},
year = {2024},
date = {2024-04-01},
urldate = {2024-06-25},
booktitle = {ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
pages = {2705–2709},
publisher = {IEEE},
address = {Seoul, Korea, Republic of},
keywords = {Graphics, VGL},
pubstate = {published},
tppubtype = {inproceedings}
}
Rizzo, Albert Skip; Hartholt, Arno; Mozgai, Sharon
Settling the Score: Virtual Reality as a Tool to Enhance Trauma-Focused Therapy for PTSD Book Section
In: Rich, Grant J.; Kumar, V. K.; Farley, Frank H. (Ed.): Handbook of Media Psychology, pp. 187–213, Springer Nature Switzerland, Cham, 2024, ISBN: 978-3-031-56536-6 978-3-031-56537-3.
Links | BibTeX | Tags: DTIC, MedVR, Simulation, VR
@incollection{rich_settling_2024,
title = {Settling the Score: Virtual Reality as a Tool to Enhance Trauma-Focused Therapy for PTSD},
author = {Albert Skip Rizzo and Arno Hartholt and Sharon Mozgai},
editor = {Grant J. Rich and V. K. Kumar and Frank H. Farley},
url = {https://link.springer.com/10.1007/978-3-031-56537-3_14},
doi = {10.1007/978-3-031-56537-3_14},
isbn = {978-3-031-56536-6 978-3-031-56537-3},
year = {2024},
date = {2024-04-01},
urldate = {2024-06-18},
booktitle = {Handbook of Media Psychology},
pages = {187–213},
publisher = {Springer Nature Switzerland},
address = {Cham},
keywords = {DTIC, MedVR, Simulation, VR},
pubstate = {published},
tppubtype = {incollection}
}
Goh, Crystal; Ma, Yu; Rizzo, Albert
Normative performance data on visual attention in neurotypical children: virtual reality assessment of cognitive and psychomotor development Journal Article
In: Front. Virtual Real., vol. 5, pp. 1309176, 2024, ISSN: 2673-4192.
Abstract | Links | BibTeX | Tags: MedVR
@article{goh_normative_2024,
title = {Normative performance data on visual attention in neurotypical children: virtual reality assessment of cognitive and psychomotor development},
author = {Crystal Goh and Yu Ma and Albert Rizzo},
url = {https://www.frontiersin.org/articles/10.3389/frvir.2024.1309176/full},
doi = {10.3389/frvir.2024.1309176},
issn = {2673-4192},
year = {2024},
date = {2024-04-01},
urldate = {2024-04-16},
journal = {Front. Virtual Real.},
volume = {5},
pages = {1309176},
abstract = {Introduction: Virtual Reality (VR) is revolutionizing healthcare research and practice by offering innovative methodologies across various clinical conditions. Advances in VR technology enable the creation of controllable, multisensory 3D environments, making it an appealing tool for capturing and quantifying behavior in realistic scenarios. This paper details the application of VR as a tool for neurocognitive evaluation, specifically in attention process assessment, an area of relevance for informing the diagnosis of childhood health conditions such as Attention Deficit Hyperactivity Disorder (ADHD). Methods: The data presented focuses on attention performance results from a large sample (n = 837) of neurotypical male and female children (ages 6–13) tested on a visual continuous performance task, administered within an immersive VR classroom environment. This data was collected to create a normative baseline database for use to inform comparisons with the performances of children with ADHD to support diagnostic decision-making in this area. Results: Results indicate systematic improvements on most metrics across the age span, and sex differences are noted on key variables thought to reflect differential measures of hyperactivity and inattention in children with ADHD. Results support VR technology as a safe and viable option for testing attention processes in children, under stimulus conditions that closely mimic ecologically relevant challenges found in everyday life. Discussion: In response to these stimulus conditions, VR can support advanced methods for capturing and quantifying users’ behavioral responses. VR offers a more systematic and objective approach for clinical assessment and intervention and provides conceptual support for its use in a wide variety of healthcare contexts.},
keywords = {MedVR},
pubstate = {published},
tppubtype = {article}
}
Soleymani, Mohammad; Rahmani, Mehdi; Bigdeli, Nooshin
Robust Tube-Based Reference Tracking Nonlinear Model Predictive Control for Wind Turbines Journal Article
In: IEEE Trans. Automat. Sci. Eng., pp. 1–13, 2024, ISSN: 1545-5955, 1558-3783.
@article{soleymani_robust_2024,
title = {Robust Tube-Based Reference Tracking Nonlinear Model Predictive Control for Wind Turbines},
author = {Mohammad Soleymani and Mehdi Rahmani and Nooshin Bigdeli},
url = {https://ieeexplore.ieee.org/document/10495787/},
doi = {10.1109/TASE.2024.3385714},
issn = {1545-5955, 1558-3783},
year = {2024},
date = {2024-04-01},
urldate = {2024-04-16},
journal = {IEEE Trans. Automat. Sci. Eng.},
pages = {1–13},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Gurney, Nikolos; Loewenstein, George; Chater, Nick
Conversational technology and reactions to withheld information Journal Article
In: PLoS ONE, vol. 19, no. 4, pp. e0301382, 2024, ISSN: 1932-6203.
Abstract | Links | BibTeX | Tags: DTIC, Social Simulation, UARC
@article{gurney_conversational_2024,
title = {Conversational technology and reactions to withheld information},
author = {Nikolos Gurney and George Loewenstein and Nick Chater},
editor = {Petre Caraiani},
url = {https://dx.plos.org/10.1371/journal.pone.0301382},
doi = {10.1371/journal.pone.0301382},
issn = {1932-6203},
year = {2024},
date = {2024-04-01},
urldate = {2024-04-16},
journal = {PLoS ONE},
volume = {19},
number = {4},
pages = {e0301382},
abstract = {People frequently face decisions that require making inferences about withheld information. The advent of large language models coupled with conversational technology, e.g., Alexa, Siri, Cortana, and the Google Assistant, is changing the mode in which people make these inferences. We demonstrate that conversational modes of information provision, relative to traditional digital media, result in more critical responses to withheld information, including: (1) a reduction in evaluations of a product or service for which information is withheld and (2) an increased likelihood of recalling that information was withheld. These effects are robust across multiple conversational modes: a recorded phone conversation, an unfolding chat conversation, and a conversation script. We provide further evidence that these effects hold for conversations with the Google Assistant, a prominent conversational technology. The experimental results point to participants’ intuitions about why the information was withheld as the driver of the effect.},
keywords = {DTIC, Social Simulation, UARC},
pubstate = {published},
tppubtype = {article}
}
Hartholt, Arno; Leeds, Andrew; Fast, Ed; Sookiassian, Edwin; Kim, Kevin; Beland, Sarah; Kulkarni, Pranav; Mozgai, Sharon
Multidisciplinary Research & Development of Multi-Agents and Virtual Humans Leveraging Integrated Middleware Platforms Proceedings Article
In: 2024.
Abstract | Links | BibTeX | Tags: DTIC, UARC, Virtual Humans
@inproceedings{hartholt_multidisciplinary_2024,
title = {Multidisciplinary Research & Development of Multi-Agents and Virtual Humans Leveraging Integrated Middleware Platforms},
author = {Arno Hartholt and Andrew Leeds and Ed Fast and Edwin Sookiassian and Kevin Kim and Sarah Beland and Pranav Kulkarni and Sharon Mozgai},
url = {https://openaccess.cms-conferences.org/publications/book/978-1-958651-95-7/article/978-1-958651-95-7_33},
doi = {10.54941/ahfe1004497},
year = {2024},
date = {2024-04-01},
urldate = {2024-04-16},
abstract = {The current pace of technological advancements has led to an ever-increasing availability of technologies to investigate and help address the challenges that contemporary society faces today. However, while this trend increases the potential for creating more relevant, effective, and efficient solutions, it also inherently increases the complexity of realizing that potential. Our work aims to manage this complexity through the creation and dissemination of integrated middleware platforms that enable researchers and developers to rapidly prototype novel solutions within the areas of modelling & simulation, virtual humans, and virtual worlds. In this paper, we discuss two related platforms: the Rapid Integration & Development Environment (RIDE) and the Virtual Human Toolkit (VHToolkit). Specifically, we explore two use cases: 1) the development of an authoring tool aimed at domain experts to rapidly create low-echelon military training scenarios, and 2) the development of a virtual human-led mHealth wellness and suicide prevention app for veterans.},
keywords = {DTIC, UARC, Virtual Humans},
pubstate = {published},
tppubtype = {inproceedings}
}
Georgila, Kallirroi; Traum, David
Evaluation of Off-the-shelf Whisper Models for Speech Recognition Across Diverse Dialogue Domains Proceedings Article
In: Proceedings of the 14th International Workshop on Spoken Dialogue Systems Technology, Sapporo, Japan, 2024.
@inproceedings{georgila_evaluation_2024,
title = {Evaluation of Off-the-shelf Whisper Models for Speech Recognition Across Diverse Dialogue Domains},
author = {Kallirroi Georgila and David Traum},
url = {https://kgeorgila.github.io/publications/georgila_iwsds24.pdf},
year = {2024},
date = {2024-03-01},
booktitle = {Proceedings of the 14th International Workshop on Spoken Dialogue Systems Technology},
address = {Sapporo, Japan},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
DeTore, Nicole R.; Balogun-Mwangi, Oyenike; Eberlin, Elizabeth S.; Dokholyan, Katherine N.; Rizzo, Albert; Holt, Daphne J.
An Artificial Intelligence-Based Virtual Human Avatar Application to Assess the Mental Health of Health Care Professionals: A Validation Study Journal Article
In: Journal of Medical Extended Reality, vol. 1, no. 1, pp. 215–226, 2024, ISSN: 2994-1520.
@article{detore_artificial_2024,
title = {An Artificial Intelligence-Based Virtual Human Avatar Application to Assess the Mental Health of Health Care Professionals: A Validation Study},
author = {Nicole R. DeTore and Oyenike Balogun-Mwangi and Elizabeth S. Eberlin and Katherine N. Dokholyan and Albert Rizzo and Daphne J. Holt},
url = {https://www.liebertpub.com/doi/10.1089/jmxr.2024.0016},
doi = {10.1089/jmxr.2024.0016},
issn = {2994-1520},
year = {2024},
date = {2024-03-01},
urldate = {2024-11-01},
journal = {Journal of Medical Extended Reality},
volume = {1},
number = {1},
pages = {215–226},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Harris, Vera; Braggs, Robert; Traum, David
I’m not sure I heard you right, but I think I know what you mean – investigations into the impact of speech recognition errors on response selection for a virtual human. Proceedings Article
In: Sapporo Japan, 2024.
Links | BibTeX | Tags: Machine Learning
@inproceedings{harris_im_2024,
title = {I’m not sure I heard you right, but I think I know what you mean – investigations into the impact of speech recognition errors on response selection for a virtual human.},
author = {Vera Harris and Robert Braggs and David Traum},
url = {https://people.ict.usc.edu/~traum/Papers/23-harris-iwsds2024.pdf},
year = {2024},
date = {2024-03-01},
address = {Sapporo Japan},
keywords = {Machine Learning},
pubstate = {published},
tppubtype = {inproceedings}
}
Brixey, Jacqueline; Traum, David
Why should a dialogue system speak more than one language? Proceedings Article
In: Sapporo Japan, 2024.
Links | BibTeX | Tags: Natural Language
@inproceedings{brixey_why_2024,
title = {Why should a dialogue system speak more than one language?},
author = {Jacqueline Brixey and David Traum},
url = {https://people.ict.usc.edu/~traum/Papers/24-Why%20should%20a%20dialogue%20system%20speak%20more%20than%20one%20language.pdf},
year = {2024},
date = {2024-03-01},
address = {Sapporo Japan},
keywords = {Natural Language},
pubstate = {published},
tppubtype = {inproceedings}
}
Chen, Haiwei; Zhao, Yajie
Don't Look into the Dark: Latent Codes for Pluralistic Image Inpainting Miscellaneous
2024, (arXiv:2403.18186 [cs]).
Abstract | Links | BibTeX | Tags: VGL
@misc{chen_dont_2024,
title = {Don't Look into the Dark: Latent Codes for Pluralistic Image Inpainting},
author = {Haiwei Chen and Yajie Zhao},
url = {http://arxiv.org/abs/2403.18186},
year = {2024},
date = {2024-03-01},
urldate = {2024-08-15},
publisher = {arXiv},
abstract = {We present a method for large-mask pluralistic image inpainting based on the generative framework of discrete latent codes. Our method learns latent priors, discretized as tokens, by only performing computations at the visible locations of the image. This is realized by a restrictive partial encoder that predicts the token label for each visible block, a bidirectional transformer that infers the missing labels by only looking at these tokens, and a dedicated synthesis network that couples the tokens with the partial image priors to generate coherent and pluralistic complete image even under extreme mask settings. Experiments on public benchmarks validate our design choices as the proposed method outperforms strong baselines in both visual quality and diversity metrics.},
note = {arXiv:2403.18186 [cs]},
keywords = {VGL},
pubstate = {published},
tppubtype = {misc}
}
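The decoding loop below is a hedged sketch of how a bidirectional transformer can infer missing token labels from visible ones, in the spirit of the pipeline above; the confidence-first schedule is a common choice for this style of model (our assumption, not necessarily this paper's), and predict_logits is a hypothetical stand-in for the trained transformer.

import torch

def infill_tokens(tokens, visible, predict_logits, steps=8):
    """tokens: (L,) long tensor; visible: (L,) bool mask of known slots;
    predict_logits(tokens, known) -> (L, vocab) logits (stand-in model)."""
    tokens, known = tokens.clone(), visible.clone()
    for _ in range(steps):
        if known.all():
            break
        probs, preds = predict_logits(tokens, known).softmax(-1).max(-1)
        probs[known] = -1.0                      # only fill unknown slots
        n_fill = max(1, int((~known).sum().item()) // steps)
        pick = probs.topk(n_fill).indices        # most confident first
        tokens[pick], known[pick] = preds[pick], True
    return tokens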
Singh, Ishika; Traum, David; Thomason, Jesse
TwoStep: Multi-agent Task Planning using Classical Planners and Large Language Models Miscellaneous
2024, (arXiv:2403.17246 [cs]).
Abstract | Links | BibTeX | Tags:
@misc{singh_twostep_2024,
title = {TwoStep: Multi-agent Task Planning using Classical Planners and Large Language Models},
author = {Ishika Singh and David Traum and Jesse Thomason},
url = {http://arxiv.org/abs/2403.17246},
year = {2024},
date = {2024-03-01},
urldate = {2024-08-15},
publisher = {arXiv},
abstract = {Classical planning formulations like the Planning Domain Definition Language (PDDL) admit action sequences guaranteed to achieve a goal state given an initial state if any are possible. However, reasoning problems defined in PDDL do not capture temporal aspects of action taking, for example that two agents in the domain can execute an action simultaneously if postconditions of each do not interfere with preconditions of the other. A human expert can decompose a goal into largely independent constituent parts and assign each agent to one of these subgoals to take advantage of simultaneous actions for faster execution of plan steps, each using only single agent planning. By contrast, large language models (LLMs) used for directly inferring plan steps do not guarantee execution success, but do leverage commonsense reasoning to assemble action sequences. We combine the strengths of classical planning and LLMs by approximating human intuitions for two-agent planning goal decomposition. We demonstrate that LLM-based goal decomposition leads to faster planning times than solving multi-agent PDDL problems directly while simultaneously achieving fewer plan execution steps than a single agent plan alone and preserving execution success. Additionally, we find that LLM-based approximations of subgoals can achieve similar multi-agent execution steps than those specified by human experts. Website and resources at https://glamor-usc.github.io/twostep},
note = {arXiv:2403.17246 [cs]},
keywords = {},
pubstate = {published},
tppubtype = {misc}
}
Gordon, Andrew S.; Feng, Andrew
Combining the Predictions of Out-of-Domain Classifiers Using Etcetera Abduction Proceedings Article
In: 2024 58th Annual Conference on Information Sciences and Systems (CISS), pp. 1–6, IEEE, Princeton, NJ, USA, 2024, ISBN: 979-8-3503-6929-8.
@inproceedings{gordon_combining_2024,
title = {Combining the Predictions of Out-of-Domain Classifiers Using Etcetera Abduction},
author = {Andrew S. Gordon and Andrew Feng},
url = {https://ieeexplore.ieee.org/document/10480194/},
doi = {10.1109/CISS59072.2024.10480194},
isbn = {979-8-3503-6929-8},
year = {2024},
date = {2024-03-01},
urldate = {2024-04-16},
booktitle = {2024 58th Annual Conference on Information Sciences and Systems (CISS)},
pages = {1–6},
publisher = {IEEE},
address = {Princeton, NJ, USA},
keywords = {DTIC, Narrative, The Narrative Group, UARC},
pubstate = {published},
tppubtype = {inproceedings}
}
Frummet, Alexander; Speggiorin, Alessandro; Elsweiler, David; Leuski, Anton; Dalton, Jeff
Cooking with Conversation: Enhancing User Engagement and Learning with a Knowledge-Enhancing Assistant Journal Article
In: ACM Trans. Inf. Syst., pp. 3649500, 2024, ISSN: 1046-8188, 1558-2868.
@article{frummet_cooking_2024,
title = {Cooking with Conversation: Enhancing User Engagement and Learning with a Knowledge-Enhancing Assistant},
author = {Alexander Frummet and Alessandro Speggiorin and David Elsweiler and Anton Leuski and Jeff Dalton},
url = {https://dl.acm.org/doi/10.1145/3649500},
doi = {10.1145/3649500},
issn = {1046-8188, 1558-2868},
year = {2024},
date = {2024-03-01},
urldate = {2024-04-16},
journal = {ACM Trans. Inf. Syst.},
pages = {3649500},
abstract = {We present two empirical studies to investigate users’ expectations and behaviours when using digital assistants, such as Alexa and Google Home, in a kitchen context: First, a survey (N=200) queries participants on their expectations for the kinds of information that such systems should be able to provide. While consensus exists on expecting information about cooking steps and processes, younger participants who enjoy cooking express a higher likelihood of expecting details on food history or the science of cooking. In a follow-up Wizard-of-Oz study (N = 48), users were guided through the steps of a recipe either by an active wizard that alerted participants to information it could provide or a passive wizard who only answered questions that were provided by the user. The active policy led to almost double the number of conversational utterances and 1.5 times more knowledge-related user questions compared to the passive policy. Also, it resulted in 1.7 times more knowledge communicated than the passive policy. We discuss the findings in the context of related work and reveal implications for the design and use of such assistants for cooking and other purposes such as DIY and craft tasks, as well as the lessons we learned for evaluating such systems.},
keywords = {DTIC, Natural Language, UARC},
pubstate = {published},
tppubtype = {article}
}
Lu, Liupei; Yin, Yufeng; Gu, Yuming; Wu, Yizhen; Prasad, Pratusha; Zhao, Yajie; Soleymani, Mohammad
Leveraging Synthetic Data for Generalizable and Fair Facial Action Unit Detection Miscellaneous
2024, (arXiv:2403.10737 [cs]).
@misc{lu_leveraging_2024,
title = {Leveraging Synthetic Data for Generalizable and Fair Facial Action Unit Detection},
author = {Liupei Lu and Yufeng Yin and Yuming Gu and Yizhen Wu and Pratusha Prasad and Yajie Zhao and Mohammad Soleymani},
url = {http://arxiv.org/abs/2403.10737},
year = {2024},
date = {2024-03-01},
urldate = {2024-04-16},
publisher = {arXiv},
abstract = {Facial action unit (AU) detection is a fundamental block for objective facial expression analysis. Supervised learning approaches require a large amount of manual labeling which is costly. The limited labeled data are also not diverse in terms of gender, which can affect model fairness. In this paper, we propose to use synthetically generated data and multi-source domain adaptation (MSDA) to address the problems of the scarcity of labeled data and the diversity of subjects. Specifically, we propose to generate a diverse dataset through synthetic facial expression re-targeting by transferring the expressions from real faces to synthetic avatars. Then, we use MSDA to transfer the AU detection knowledge from a real dataset and the synthetic dataset to a target dataset. Instead of aligning the overall distributions of different domains, we propose Paired Moment Matching (PM2) to align the features of the paired real and synthetic data with the same facial expression. To further improve gender fairness, PM2 matches the features of the real data with a female and a male synthetic image. Our results indicate that synthetic data and the proposed model improve both AU detection performance and fairness across genders, demonstrating its potential to solve AU detection in the wild.},
note = {arXiv:2403.10737 [cs]},
keywords = {DTIC, UARC, Virtual Humans},
pubstate = {published},
tppubtype = {misc}
}
Tran, Minh; Chang, Di; Siniukov, Maksim; Soleymani, Mohammad
Dyadic Interaction Modeling for Social Behavior Generation Miscellaneous
2024, (arXiv:2403.09069 [cs]).
@misc{tran_dyadic_2024,
title = {Dyadic Interaction Modeling for Social Behavior Generation},
author = {Minh Tran and Di Chang and Maksim Siniukov and Mohammad Soleymani},
url = {http://arxiv.org/abs/2403.09069},
year = {2024},
date = {2024-03-01},
urldate = {2024-03-19},
publisher = {arXiv},
abstract = {Human-human communication is like a delicate dance where listeners and speakers concurrently interact to maintain conversational dynamics. Hence, an effective model for generating listener nonverbal behaviors requires understanding the dyadic context and interaction. In this paper, we present an effective framework for creating 3D facial motions in dyadic interactions. Existing work considers a listener as a reactive agent with reflexive behaviors in response to the speaker's voice and facial motions. The heart of our framework is Dyadic Interaction Modeling (DIM), a pre-training approach that jointly models speakers' and listeners' motions through masking and contrastive learning to learn representations that capture the dyadic context. To enable the generation of non-deterministic behaviors, we encode both listener and speaker motions into discrete latent representations, through VQ-VAE. The pre-trained model is further fine-tuned for motion generation. Extensive experiments demonstrate the superiority of our framework in generating listener motions, establishing a new state-of-the-art according to the quantitative measures capturing the diversity and realism of generated motions. Qualitative results demonstrate the superior capabilities of the proposed approach in generating diverse and realistic expressions, eye blinks and head gestures.},
note = {arXiv:2403.09069 [cs]},
keywords = {DTIC, UARC, Virtual Humans},
pubstate = {published},
tppubtype = {misc}
}