@ARTICLE{10.3389/fmars.2022.869088, AUTHOR={Le, Kevin T. and Yuan, Zhouyuan and Syed, Areeb and Ratelle, Devin and Orenstein, Eric C. and Carter, Melissa L. and Strang, Sarah and Kenitz, Kasia M. and Morgado, Pedro and Franks, Peter J. S. and Vasconcelos, Nuno and Jaffe, Jules S.}, TITLE={Benchmarking and Automating the Image Recognition Capability of an In Situ Plankton Imaging System}, JOURNAL={Frontiers in Marine Science}, VOLUME={9}, YEAR={2022}, URL={https://www.frontiersin.org/article/10.3389/fmars.2022.869088}, DOI={10.3389/fmars.2022.869088}, ISSN={2296-7745}, ABSTRACT={To understand ocean health, it is crucial to monitor photosynthetic marine plankton – the microorganisms that form the base of the marine food web and are responsible for the uptake of atmospheric carbon. With the recent development of in situ microscopes that can acquire vast numbers of images of these organisms, the use of deep learning methods to taxonomically identify them has come to the forefront. Given this, two questions arise: 1) How well do deep learning methods such as Convolutional Neural Networks (CNNs) identify these marine organisms using data from in situ microscopes? 2) How well do CNN-derived estimates of abundance agree with established net and bottle-based sampling? Here, using images collected by the in situ Scripps Plankton Camera (SPC) system, we trained a CNN to recognize 9 species of phytoplankton, some of which are associated with Harmful Algal Blooms (HABs). The CNNs evaluated on 26 independent natural samples collected at Scripps Pier achieved an averaged accuracy of 92%, with 7 of 10 target categories above 85%. To compare abundance estimates, we fit a linear model between the number of organisms of each species counted in a known volume in the lab, with the number of organisms collected by the in situ microscope sampling at the same time. The linear fit between lab and in situ counts of several of the most abundant key HAB species suggests that, in the case of dinoflagellates, there is good correspondence between the two methods. As one advantage of our method, given the excellent correlation between lab counts and in situ microscope counts for key species, the methodology proposed here provides a way to estimate an equivalent volume in which the employed microscope can identify in-focus organisms and obtain statistically robust estimates of abundance.} }