@article {zevin2023gravity, title = {Gravity Spy: Lessons Learned and a Path Forward}, journal = {European Physical Journal Plus}, volume = {139}, year = {2024}, month = {01/2024}, pages = {Article 100}, abstract = {

The Gravity Spy project aims to uncover the origins of glitches, transient bursts of noise that hamper analysis of gravitational-wave data. By using both the work of citizen-science volunteers and machine-learning algorithms, the Gravity Spy project enables reliable classification of glitches. Citizen science and machine learning are intrinsically coupled within the Gravity Spy framework, with machine-learning classifications providing a rapid first-pass classification of the dataset and enabling tiered volunteer training, and volunteer-based classifications verifying the machine classifications, bolstering the machine-learning training set and identifying new morphological classes of glitches. These classifications are now routinely used in studies characterizing the performance of the LIGO gravitational-wave detectors. Providing the volunteers with a training framework that teaches them to classify a wide range of glitches, as well as additional tools to aid their investigations of interesting glitches, empowers them to make discoveries of new classes of glitches. This demonstrates that, when giving suitable support, volunteers can go beyond simple classification tasks to identify new features in data at a level comparable to domain experts. The Gravity Spy project is now providing volunteers with more complicated data that includes auxiliary monitors of the detector to identify the root cause of glitches.

}, doi = {10.1140/epjp/s13360-023-04795-4}, author = {Michael Zevin and Corey B. Jackson and Zoheyr Doctor and Yunan Wu and Carsten {\O}sterlund and L. Clifton Johnson and Christopher P. L. Berry and Kevin Crowston and Scott B. Coughlin and Vicky Kalogera and Sharan Banagiri and Derek Davis and Jane Glanzer and Renzhi Hao and Aggelos K. Katsaggelos and Oli Patane and Jennifer Sanchez and Joshua Smith and Siddharth Soni and Laura Trouille and Marissa Walker and Irina Aerith and Wilfried Domainko and Victor-Georges Baranowski and Gerhard Niklasch and Barbara T{\'e}gl{\'a}s} } @article {9998, title = {Knowledge Tracing to Model Learning in Online Citizen Science Projects}, journal = {IEEE Transactions on Learning Technologies}, volume = {13}, year = {2020}, pages = {123-134}, abstract = {

We present the design of a citizen science system that uses machine learning to guide the presentation of image classification tasks to newcomers to help them more quickly learn how to do the task while still contributing to the work of the project. A Bayesian model for tracking volunteer learning for training with tasks with uncertain outcomes is presented and fit to data from 12,986 volunteer contributors. The model can be used both to estimate the ability of volunteers and to decide the classification of an image. A simulation of the model applied to volunteer promotion and image retirement suggests that the model requires fewer classifications than the current system.

}, issn = {1939-1382}, doi = {10.1109/TLT.2019.2936480 }, attachments = {https://crowston.syr.edu/sites/crowston.syr.edu/files/transaction\%20paper\%20final\%20figures\%20in\%20text.pdf}, author = {Kevin Crowston and Carsten {\O}sterlund and Tae Kyoung Lee and Corey Brian Jackson and Mahboobeh Harandi and Sarah Allen and Sara Bahaadini and Scott Coughlin and Aggelos Katsaggelos and Shane Larson and Neda Rohani and Joshua Smith and Laura Trouille and Michael Zevin} } @article {9999, title = {Teaching Citizen Scientists to Categorize Glitches using Machine-Learning-Guided Training}, journal = {Computers in Human Behavior}, volume = {105}, year = {2020}, pages = {106198}, abstract = {

Training users in online communities is important for making high performing contributors. However, several conundrums exists in choosing the most effective approaches to training users. For example, if it takes time to learn to do the task correctly, then the initial contributions may not be of high enough quality to be useful. We conducted an online field experiment where we recruited users (N = 386) in a web-based citizen-science project to evaluate the two training approaches. In one training regime, users received one-time training and were asked to learn and apply twenty classes to the data. In the other approach, users were gradually exposed to classes of data that were selected by trained machine learning algorithms as being members of particular classes. The results of our analysis revealed that the gradual training produced {\textquotedblleft}high performing contributors{\textquotedblright}. In our comparison of the treatment and control groups we found users who experienced gradual training performed significantly better on the task (an average accuracy of 90\% vs. 54\%), contributed more work (an average of 228 vs. 121 classifications), and were retained in the project for a longer period of time (an average of 2.5 vs. 2 sessions). The results suggests online production communities seeking to train newcomers would benefit from training regimes that gradually introduce them to the work of the project using real tasks.

}, doi = {10.1016/j.chb.2019.106198}, attachments = {https://crowston.syr.edu/sites/crowston.syr.edu/files/MLGT-preprint.pdf}, author = {Corey Jackson and Carsten {\O}sterlund and Kevin Crowston and Mahboobeh Harandi and Sarah Allen and Sara Bahaadini and Scott Coughlin and Vicky Kalogera and Aggelos Katsaggelos and Shane Larson and Neda Rohani and Joshua Smith and Laura Trouille and Michael Zevin} } @article {2019, title = {Classifying the unknown: Discovering novel gravitational-wave detector glitches using similarity learning}, journal = {Physical Review D}, volume = {99}, year = {2019}, pages = {082002}, abstract = {

The observation of gravitational waves from compact binary coalescences by LIGO and Virgo has begun a new era in astronomy. A critical challenge in making detections is determining whether loud transient features in the data are caused by gravitational waves or by instrumental or environmental sources. The citizen-science project Gravity Spy has been demonstrated as an efficient infrastructure for classifying known types of noise transients (glitches) through a combination of data analysis performed by both citizen volunteers and machine learning. We present the next iteration of this project, using similarity indices to empower citizen scientists to create large data sets of unknown transients, which can then be used to facilitate supervised machine-learning characterization. This new evolution aims to alleviate a persistent challenge that plagues both citizen-science and instrumental detector work: the ability to build large samples of relatively rare events. Using two families of transient noise that appeared unexpectedly during LIGO{\textquoteright}s second observing run, we demonstrate the impact that the similarity indices could have had on finding these new glitch types in the Gravity Spy program.

}, issn = {2470-0010}, doi = {10.1103/PhysRevD.99.082002}, author = {Scott Coughlin and Sara Bahaadini and Neda Rohani and Michael Zevin and Patane, Oli and Mahboobeh Harandi and Corey Brian Jackson and Noroozi, V. and Sarah Allen and Areeda, J. and Coughlin, M. and Ruiz, P. and Berry, C. P. L. and Kevin Crowston and Aggelos Katsaggelos and Andrew Lundgren and Carsten {\O}sterlund and Joshua Smith and Laura Trouille and Vicky Kalogera} } @article {657, title = {Gravity Spy: Integrating Advanced LIGO Detector Characterization, Machine Learning, and Citizen Science}, journal = {Classical and Quantum Gravity}, volume = {34}, year = {2017}, pages = {064003}, type = {Journal Article}, doi = {10.1088/1361-6382/aa5cea}, author = {Michael Zevin and Scott Coughlin and Sara Bahaadini and Emre Besler and Neda Rohani and Sarah Allen and Miriam Cabero and Kevin Crowston and Aggelos Katsaggelos and Shane Larson and Tae Kyoung Lee and Chris Lintott and Tyson Littenberg and Andrew Lundgren and Carsten Oesterlund and Joshua Smith and Laura Trouille and Vicky Kalogera} }