% Journal article record. The month uses the standard three-letter macro and the DOI is stored bare in its own field; the resolver URL is retained as well.
@article{discovery10128881,
  author    = {Tian, Z and Zhang, X and Wei, S and Du, S and Shi, X},
  title     = {A review of data-driven building performance analysis and design on big on-site building performance data},
  journal   = {Journal of Building Engineering},
  volume    = {41},
  year      = {2021},
  month     = sep,
  publisher = {Elsevier BV},
  doi       = {10.1016/j.jobe.2021.102706},
  url       = {https://doi.org/10.1016/j.jobe.2021.102706},
  note      = {This version is the author accepted manuscript. For information on re-use, please refer to the publisher's terms and conditions.},
  keywords  = {Building performance design, data-driven, building energy, building performance data},
  abstract  = {Building performance design (BPD) is a crucial pathway to achieve high-performance buildings. Previous simulation-based BPD is being questioned due to the performance gaps between simulated and measured values. In recent years, accumulated on-site building performance data (OBPD) make it possible to analyze and design buildings with data-driven methods. This article makes a review of previous studies that conducted data-driven building performance analysis and design on a large amount of OBPD. The covered studies are summarized by the applied techniques, i.e., statistics, regression, classification, and clustering. The data used by these studies are compared and discussed emphasizing the data size and public availability. A comprehensive discussion is given about the achievements of existing studies, and challenges for boosting data-driven BPD from three aspects, i.e., developing data-driven models, the availability of building performance data, and stimulation of industrial practices. The review results indicate that data-driven methods were commonly applied to estimate energy consumptions, and explore energy trends, determinant features, and reference buildings. Identifying determinant features is one of the most successful applications. This study highlights the future research gaps for boosting data-driven building performance design.},
}