Citation

BibTex format

@inproceedings{Zuo:2025,
author = {Zuo, H and Yin, Y and Hazeri, K and Wang, B and Jennings, T and Buhagiar, J and Cartwright, B and Liu, R and Childs, P},
pages = {98--103},
publisher = {The University of Salford},
title = {Automating operations and maintenance manual data extraction for retrofit applications: assessing GPT-4o’s performance and challenges},
year = {2025}
}

RIS format (EndNote, RefMan)

TY  - CPAPER
AB - Operations & Maintenance (O&M) manuals contain data that is essential to understand ahead of building retrofits. However, their unstructured format makes information retrieval time-consuming and error-prone. This study evaluates GPT-4o’s ability to extract information from O&M manuals, assessing accuracy in text extraction, categorization, and numerical data handling. Structured extraction steps and prompt strategies were developed based on industry needs. The extraction performance was compared to human-extracted data based on a dataset of 60 O&M manuals, using quantitative and qualitative evaluation. Results form the study show that text-based extraction is reliable, particularly for component names, types, and manufacturer details, where formatting differences had little impact on accuracy. However, challenges appeared in fields requiring categorization, numerical interpretation, and structured mapping. One issue was category misalignment, where GPT-4o could assign components to broad categories but had difficulty with domain-specific classifications that require specialized knowledge. This inconsistency suggests that rule-based constraints or further adjustments may be needed to improve standardization in retrofit applications. Another challenge was the model’s handling of numerical data. Mistakes occurred in quantity extraction, page numbering, and location references, where the model miscalculated totals, misread measurement units, or mismatched printed and digital page numbers. These errors suggest that GPT-4o lacks a way to process numerical information in context, meaning manual checks are still required for numerical fields. These findings highlight GPT-4o’s potential to automate O&M data extraction, reducing manual effort and speeding up the retrofit process.
AU - Zuo,H
AU - Yin,Y
AU - Hazeri,K
AU - Wang,B
AU - Jennings,T
AU - Buhagiar,J
AU - Cartwright,B
AU - Liu,R
AU - Childs,P
EP - 103
PB - The University of Salford
PY - 2025///
SP - 98
TI - Automating operations and maintenance manual data extraction for retrofit applications: assessing GPT-4o’s performance and challenges
ER -