@inproceedings{7d47ae93cbdf429584924d41a8b5d842,
title = "Facilitating feature selection and extraction in clinical trials with large language models",
abstract = "Research on clinical trials requires substantial background and technical knowledge. Large language models (LLMs) have already made a significant impact in various fields. We attempted to use general-purpose LLMs to assist newcomers in clinical trials, enabling them to quickly begin their work. In our work, we demonstrated that in the domain of clinical trials, the current cutting-edge LLMs can provide excellent recommendations for feature selection. By utilizing the features suggested by LLMs, we achieved a 2.5% improvement in AUC compared to complex neural network models when using simpler algorithms. We have also demonstrated that by adjusting the prompts, LLM can play a significant role in the feature extraction process. By adjusting the prompts for certain features suggested by LLM, LLM-assisted feature extraction achieved 100% accuracy in a random sample covering approximately 10% of the entire dataset.",
keywords = "Clinical Trials, Application of LLMs, Healthcare",
author = "Jiaji Guo and Wen Sun and Shiting Wen and Di Wu and Yipeng Zhou",
year = "2025",
doi = "10.1007/978-981-96-0840-9_16",
language = "English",
isbn = "9789819608393",
series = "Lecture Notes in Computer Science",
publisher = "Springer, Springer Nature",
pages = "230--240",
editor = "Sheng, {Quan Z.} and Gill Dobbie and Jing Jiang and Xuyun Zhang and Zhang, {Wei Emma} and Yannis Manolopoulos and Jia Wu and Wathiq Mansoor and Congbo Ma",
booktitle = "Advanced Data Mining and Applications",
address = "United States",
note = "20th International Conference on Advanced Data Mining Applications, ADMA 2024 ; Conference date: 03-12-2024 Through 05-12-2024",
}