@article{zhang_maleski_ashrafi_spencer_chu_2024, title={Open-Source High-Throughput Phenotyping for Blueberry Yield and Maturity Prediction Across Environments: Neural Network Model and Labeled Dataset for Breeders}, volume={10}, ISSN={["2311-7524"]}, url={https://doi.org/10.3390/horticulturae10121332}, DOI={10.3390/horticulturae10121332}, abstractNote={Time to maturity and yield are important traits for highbush blueberry (Vaccinium corymbosum) breeding. Proper determination of the time to maturity of blueberry varieties and breeding lines informs the harvest window, ensuring that the fruits are harvested at optimum maturity and quality. On the other hand, high-yielding crops bring in high profits per acre of planting. Harvesting and quantifying the yield for each blueberry breeding accession are labor-intensive and impractical. Instead, visual ratings as an estimation of yield are often used as a faster way to quantify the yield, which is categorical and subjective. In this study, we developed and shared a high-throughput phenotyping method using neural networks to predict blueberry time to maturity and to provide a proxy for yield, overcoming the labor constraints of obtaining high-frequency data. We aim to facilitate further research in computer vision and precision agriculture by publishing the labeled image dataset and the trained model. In this research, true-color images of blueberry bushes were collected, annotated, and used to train a deep neural network object detection model [You Only Look Once (YOLOv11)] to detect mature and immature berries. Different versions of YOLOv11 were used, including nano, small, and medium, which had similar performance, while the medium version had slightly higher metrics. The YOLOv11m model shows strong performance for the mature berry class, with a precision of 0.90 and an F1 score of 0.90. The precision and recall for detecting immature berries were 0.81 and 0.79. The model was tested on 10 blueberry bushes by hand harvesting and weighing blueberries. The results showed that the model detects approximately 25% of the berries on the bushes, and the correlation coefficients between model-detected and hand-harvested traits were 0.66, 0.86, and 0.72 for mature fruit count, immature fruit count, and mature ratio, respectively. The model applied to 91 blueberry advance selections and categorized them into groups with diverse levels of maturity and productivity using principal component analysis (PCA). These results inform the harvest window and yield of these breeding lines with precision and objectivity through berry classification and quantification. This model will be helpful for blueberry breeders, enabling more efficient selection, and for growers, helping them accurately estimate optimal harvest windows. This open-source tool can potentially enhance research capabilities and agricultural productivity.}, number={12}, journal={HORTICULTURAE}, author={Zhang, Jing and Maleski, Jerome and Ashrafi, Hudson and Spencer, Jessica A. and Chu, Ye}, year={2024}, month={Dec} }