@article{wang_liu_hsiang_leming_2012, title={Causes and Penalties of Variation: Case Study of a Precast Concrete Slab Production Facility}, volume={138}, ISSN={0733-9364 1943-7862}, url={http://dx.doi.org/10.1061/(asce)co.1943-7862.0000475}, DOI={10.1061/(asce)co.1943-7862.0000475}, abstractNote={Concrete precast plants require strict control over and adherence to the timing and sequence of operations. Variation for this research is divided into the variation in task starting time (the difference between the planned and the actual starting time) and the variation in task duration (the difference between the planned and the actual task duration). This study determined causes of variation in task starting time and duration of precast concrete slab production tasks. It also identified penalties associated with not reducing variation, which include an increase in project duration, Work in-Progress (WIP) and cost and a decrease in labor productivity. Additionally, two execution policies (keeping laborers waiting before preconditions are ready and keeping laborers busy) in the face of variation were compared by using STROBOSCOPE simulation techniques. It was found that simply keeping workers busy is insufficient for managing variation. Management effort should be devoted to eliminate causes of variation in the planning stage to make a reliable work plan. The results will help prefabricators to understand causes and penalties of variation, which is the starting point of attacking and reducing it. Although this study is based on a concrete slab production facility, this research can have a broader effect on the construction industry because the research method and simulation models developed in this study are applicable to other fabrication processes as well.}, number={6}, journal={Journal of Construction Engineering and Management}, publisher={American Society of Civil Engineers (ASCE)}, author={Wang, Chao and Liu, Min and Hsiang, Simon M. and Leming, Michael L.}, year={2012}, month={Jun}, pages={775–785} } @article{yuan_wang_skibniewski_li_2012, title={Developing Key Performance Indicators for Public-Private Partnership Projects: Questionnaire Survey and Analysis}, volume={28}, ISSN={["1943-5479"]}, DOI={10.1061/(asce)me.1943-5479.0000113}, abstractNote={AbstractPublic-private partnerships (PPPs) are increasing in popularity. Major challenges in the development of PPPs have resulted from the global financial crisis. However, with respect to their monetary value, PPPs are still an attractive option for public sector projects. Performance management and measurement, in which Key Performance Indicators (KPIs) are the core elements, viewed as effective methods to help PPPs deliver value for money. This article describes in greater detail a KPI conceptual model composed of 5 performance packages and 48 indicators developed by the authors in previous studies. A structured questionnaire survey explored PPP stakeholders perceptions of 48 project performance indicators (PIs) to identify actual KPIs for performance management and measurement in PPPs. Although the survey results show that all PIs are important, performance packages contribute differently to the overall project performance. A confirmatory factor analysis (CFA) was used to test whether the proposed co...}, number={3}, journal={JOURNAL OF MANAGEMENT IN ENGINEERING}, author={Yuan, Jingfeng and Wang, Chao and Skibniewski, Miroslaw J. and Li, Qiming}, year={2012}, month={Jul}, pages={252–264} } @article{wang_mueller_engelmann_scott_2012, title={Proactive process-level live migration and back migration in HPC environments}, volume={72}, ISSN={["1096-0848"]}, DOI={10.1016/j.jpdc.2011.10.009}, abstractNote={As the number of nodes in high-performance computing environments keeps increasing, faults are becoming common place. Reactive fault tolerance (FT) often does not scale due to massive I/O requirements and relies on manual job resubmission. This work complements reactive with proactive FT at the process level. Through health monitoring, a subset of node failures can be anticipated when one’s health deteriorates. A novel process-level live migration mechanism supports continued execution of applications during much of process migration. This scheme is integrated into an MPI execution environment to transparently sustain health-inflicted node failures, which eradicates the need to restart and requeue MPI jobs. Experiments indicate that 1–6.5 s of prior warning are required to successfully trigger live process migration while similar operating system virtualization mechanisms require 13–24 s. This self-healing approach complements reactive FT by nearly cutting the number of checkpoints in half when 70% of the faults are handled proactively. The work also provides a novel back migration approach to eliminate load imbalance or bottlenecks caused by migrated tasks. Experiments indicate the larger the amount of outstanding execution, the higher the benefit due to back migration.}, number={2}, journal={JOURNAL OF PARALLEL AND DISTRIBUTED COMPUTING}, author={Wang, Chao and Mueller, Frank and Engelmann, Christian and Scott, Stephen L.}, year={2012}, month={Feb}, pages={254–267} } @article{scott_engelmann_vallee_naughton_tikotekar_ostrouchov_leangsuksun_naksinehaboon_nassar_paun_et al._2009, title={A Tunable Holistic Resiliency Approach for High-Performance Computing Systems}, volume={44}, ISSN={["1558-1160"]}, DOI={10.1145/1594835.1504227}, abstractNote={In order to address anticipated high failure rates, resiliency characteristics have become an urgent priority for next-generation extreme-scale high-performance computing (HPC) systems. This poster describes our past and ongoing efforts in novel fault resilience technologies for HPC. Presented work includes proactive fault resilience techniques, system and application reliability models and analyses, failure prediction, transparent process- and virtual-machine-level migration, and trade-off models for combining preemptive migration with checkpoint/restart. This poster summarizes our work and puts all individual technologies into context with a proposed holistic fault resilience framework.}, number={4}, journal={ACM SIGPLAN NOTICES}, author={Scott, Stephen L. and Engelmann, Christian and Vallee, Geoffroy R. and Naughton, Thomas and Tikotekar, Anand and Ostrouchov, George and Leangsuksun, Chokchai and Naksinehaboon, Nichamon and Nassar, Raja and Paun, Mihaela and et al.}, year={2009}, month={Apr}, pages={305–306} } @inproceedings{wang_mueller_engelmann_scott_2008, title={Proactive process-level live migration in HPC environments}, DOI={10.1109/sc.2008.5222634}, abstractNote={As the number of nodes in high-performance computing environments keeps increasing, faults are becoming common place. Reactive fault tolerance (FT) often does not scale due to massive I/O requirements and relies on manual job resubmission. This work complements reactive with proactive FT at the process level. Through health monitoring, a subset of node failures can be anticipated when one's health deteriorates. A novel process-level live migration mechanism supports continued execution of applications during much of processes migration. This scheme is integrated into an MPI execution environment to transparently sustain health-inflicted node failures, which eradicates the need to restart and requeue MPI jobs. Experiments indicate that 1-6.5 seconds of prior warning are required to successfully trigger live process migration while similar operating system virtualization mechanisms require 13-24 seconds. This self-healing approach complements reactive FT by nearly cutting the number of checkpoints in half when 70% of the faults are handled proactively.}, booktitle={International Conference for High Performance Computing, Networking, Storage and Analysis}, author={Wang, C. and Mueller, F. and Engelmann, C. and Scott, S. L.}, year={2008}, pages={126–137} }