isle_pubs.bib

% Venue abbreviations referenced (unquoted) by the entries below.
@string{aaai        = {Proceedings of the National Conference on Artificial Intelligence}}
@string{icassp      = {Proc. {ICASSP}}}
@string{iclr        = {Proc. International Conference on Learning Representations (ICLR)}}
@string{icml        = {Proc. International Conference on Machine Learning (ICML)}}
@string{interspeech = {Proc. {Interspeech}}}
@string{jasa        = {J. Acoust. Soc. Am.}}
@string{jsc         = {Speech Communication}}
@string{jslhr       = {Journal of Speech, Language, and Hearing Research}}
@string{slt         = {{IEEE} Spoken Language Technology (SLT)}}

@inproceedings{singh2024comprehensive,
  author = {Satwinder Singh and Zihan Zhong and Qianli Wang and Clarion Mendes and Mark Hasegawa-Johnson and Waleed Abdulla and Seyed Reza Shahamiri},
  title = {A Comprehensive Performance Evaluation of {Whisper} Models in Dysarthric Speech Recognition},
  booktitle = {International Conference on Neural Information Processing (ICONIP2024)},
  year = {2024},
  month = dec
}
 
@inproceedings{khan2024infantmotion2vec,
  author = {Mohammad Nur Hossain Khan and Nancy McElwain and Mark Hasegawa-Johnson and Bashima Islam},
  title = {{InfantMotion2Vec}: Unlabeled Data-Driven Infant Pose Estimation Using a Single Chest {IMU}},
  booktitle = {IEEE International Conference on Wearable and Implantable Body Sensor Networks (BSN 2024)},
  year = {2024},
  month = oct
}

@inproceedings{ramig2024empathy,
  author = {Lorraine Ramig and Heather Hodges and Clarion Mendes and Mark Hasegawa-Johnson},
  title = {Empathy in Action: Recruiting and Training Individuals With Parkinson's Disease for Speech ASR Advancements},
  booktitle = {American Speech Language Hearing Association (ASHA) Annual Convention},
  year = {2024},
  month = dec,
  note = {unpublished presentation}
}
 
@inproceedings{kim2024overview,
  author = {Heejin Kim and Clarion Mendes and Mark Hasegawa-Johnson and Meg Dickinson and Erik Hege},
  title = {An Overview of Speech Data in the Speech Accessibility Project: Speech Variations for Inclusive Technology},
  booktitle = {American Speech Language Hearing Association (ASHA) Annual Convention},
  year = {2024},
  month = dec,
  note = {unpublished presentation}
}
 
@unpublished{hasegawajohnson2023community,
  author = {Mark Hasegawa-Johnson and Heejin Kim and Xiuwen Zheng and Meg Dickinson and Erik Hege and Clarion Mendes and Chris Zwilling and Shadi Abou-Zahra and Leah Findlater and Aaron Gustafson and Bob MacDonald and Mike Shebanek and Adina Bradshaw and Shawnise Carter and Blair Casey and Marie Moore Channell and Kayla Ferguson and Heather Hodges and Laura Mattie and Lorraine Ramig},
  title = {Community-supported shared infrastructure in support of speech accessibility},
  volume = {67},
  number = {11},
  year = {2023},
  url = {https://vimeo.com/911627521},
  note = {Unpublished presentation at the ASHA 2023 Research Symposium}
}
 
@article{hasegawajohnson2024community,
  author = {Mark Hasegawa-Johnson and Xiuwen Zheng and Heejin Kim and Clarion Mendes and Meg Dickinson and Erik Hege and Chris Zwilling and Marie Moore Channell and Laura Mattie and Heather Hodges and Lorraine Ramig and Mary Bellard and Mike Shebanek and Leda Sarı and Kaustubh Kalgaonkar and David Frerichs and Jeffrey P. Bigham and Leah Findlater and Colin Lea and Sarah Herrlinger and Peter Korn and Shadi Abou-Zahra and Rus Heywood and Katrin Tomanek and Bob MacDonald},
  title = {Community-supported shared infrastructure in support of speech accessibility},
  journal = jslhr,
  volume = {67},
  number = {10},
  year = {2024},
  doi = {10.1044/2024_JSLHR-24-00122},
  url = {https://pubs.asha.org/doi/10.1044/2024_JSLHR-24-00122}
}
 
@article{harvill2024multimodal,
  author = {John Harvill and Moitreya Chatterjee and Shaveta Khosla and Mustafa Alam and Narendra Ahuja and Mark Hasegawa-Johnson and David Chestek and David Beiser},
  title = {Multimodal Respiratory Rate Estimation from Audio and Video in Emergency Department Patients},
  journal = {IEEE Journal of Translational Engineering in Health and Medicine},
  year = {2024},
  issn = {2168-2372},
  doi = {10.1109/JTEHM.2024.3418345},
  url = {https://ieeexplore.ieee.org/document/10570324}
}

@inproceedings{li2024enhancing,
  author = {Jialu Li and Mark Hasegawa-Johnson and Karrie Karahalios},
  title = {Enhancing Child Vocalization Classification with Phonetically-Tuned Embeddings for Assisting Autism Diagnosis},
  booktitle = interspeech,
  year = {2024},
  month = sep,
  doi = {10.21437/Interspeech.2024-540}
}

@inproceedings{yoon2024litta,
  author = {Eunseop Yoon and Hee Suk Yoon and John Harvill and Mark Hasegawa-Johnson and Chang D. Yoo},
  title = {{LI-TTA}: Language Informed Test-Time Adaptation for Automatic Speech Recognition},
  booktitle = interspeech,
  year = {2024},
  month = sep,
  doi = {10.21437/Interspeech.2024-1829}
}

@article{li2022visualizations,
  author = {Li, Jialu and Hasegawa-Johnson, Mark and McElwain, Nancy L},
  title = {Visualizations of Complex Sequences of Family-Infant Vocalizations Using Bag-of-Audio-Words Approach Based on Wav2vec 2.0 Features},
  journal = {arXiv preprint arXiv:2203.15183},
  year = {2022},
  eprint = {2203.15183},
  archiveprefix = {arXiv},
  url = {https://arxiv.org/pdf/2203.15183}
}

@inproceedings{zheng2024fine,
  author = {Xiuwen Zheng and Bornali Phukon and Mark Hasegawa-Johnson},
  title = {Fine-Tuning Automatic Speech Recognition for People with Parkinson's: An Effective Strategy for Enhancing Speech Technology Accessibility},
  booktitle = interspeech,
  year = {2024},
  month = sep,
  doi = {10.21437/Interspeech.2024-1969}
}

@inproceedings{gao2024speech,
  author = {Heting Gao and Kaizhi Qian and Junrui Ni and Chuang Gan and Mark A. Hasegawa-Johnson and Shiyu Chang and Yang Zhang},
  title = {Speech Self-Supervised Learning Using Diffusion Model Synthetic Data},
  booktitle = icml,
  year = {2024},
  month = jul,
  url = {https://openreview.net/forum?id=ecnpYYHjt9}
}

@inproceedings{hu2024real2,
  author = {Yannan Hu and Nancy L. McElwain and Mark Hasegawa-Johnson},
  title = {Real-Time Relations Between Prosodic Features of Infant-Directed Speech and Infant Attention at 3 Months},
  booktitle = {Speech Prosody},
  year = {2024},
  month = jul,
  doi = {10.21437/SpeechProsody.2024-45},
  note = {accepted for publication}
}
 
@article{singh2024lightweight,
  author = {Abhayjeet Singh and Amala Nagireddi and Anjali Jayakumar and Deekshitha G and Jesuraja Bandekar and Roopa R and Sandhya Badiger and Sathvik Udupa and Saurabh Kumar and Prasanta Kumar Ghosh and Hema A Murthy and Heiga Zen and Pranaw Kumar and Kamal Kant and Amol Bole and Bira Chandra Singh and Keiichi Tokuda and Mark Hasegawa-Johnson and Philipp Olbrich},
  title = {Lightweight, Multi-speaker, Multi-lingual Indic Text-To-Speech},
  journal = {IEEE Open Journal of Signal Processing},
  volume = {5},
  pages = {790--798},
  year = {2024},
  month = mar,
  issn = {2644-1322},
  doi = {10.1109/OJSP.2024.3379092},
  url = {https://ieeexplore.ieee.org/document/10479171}
}

@article{cos2023importance,
  author = {Eugene Cox and Mark Hasegawa-Johnson and Suma Bhat and Mukhil Umashankar and H Chad Lane and Daniel Morrow},
  title = {The Importance of Diverse User Goals When Designing an Automated {COVID} Risk Counselor},
  journal = {Proceedings of the International Symposium on Human Factors and Ergonomics in Health Care},
  volume = {12},
  number = {1},
  pages = {35--39},
  year = {2023},
  month = mar,
  publisher = {SAGE Publications},
  url = {https://journals.sagepub.com/doi/pdf/10.1177/2327857923121009}
}

@inproceedings{jahan2024finding,
  author = {Maliha Jahan and Helin Wang and Thomas Thebaud and Yinglun Sun and Giang Le and Zsuzsanna Fagyal and Odette Scharenborg and Mark Hasegawa-Johnson and Laureano Moro Velazquez and Najim Dehak},
  title = {Finding Spoken Identifications: Using {GPT-4} Annotation For An Efficient And Fast Dataset Creation Pipeline},
  booktitle = {LREC-COLING},
  pages = {7296--7306},
  year = {2024},
  month = may,
  url = {https://aclanthology.org/2024.lrec-main.641/}
}
 

@inproceedings{hu2024real,
  author = {Yannan Hu and Nancy L. McElwain and Mark Hasegawa-Johnson},
  title = {Real-time relations between fundamental frequency of infant-directed speech and infant attention at 3 months},
  booktitle = {24th International Congress of Infant Studies (ICIS)},
  address = {Glasgow, Scotland},
  year = {2024},
  month = jul,
  note = {Poster presentation}
}

@inproceedings{yoon2024calibrated,
  author = {Hee Suk Yoon and Eunseop Yoon and Joshua Tian Jin Tee and Mark A. Hasegawa-Johnson and Yingzhen Li and Chang D. Yoo},
  title = {{C-TPT}: Calibrated Test-Time Prompt Tuning for Vision-Language Models via Text Feature Dispersion},
  booktitle = iclr,
  year = {2024},
  month = may,
  url = {https://iclr.cc/virtual/2024/poster/17996}
}

% The original entry had two doi fields (the first holding the landing-page URL) and
% two number fields (3 and 2024010906). BibTeX keeps only the first of a repeated field,
% so the URL now lives in url, the bare DOI in doi, and the issue number 3 is retained.
% NOTE(review): the dropped second number value was 2024010906 -- confirm it is not needed.
@article{islam2024preliminary,
  author = {Bashima Islam and Nancy L McElwain and Jialu Li and Maria Davila and Yannan Hu and Kexin Hu and Jordan M Bodway and Ashutosh M Dhekne and Romit Roy Choudhury and Mark Hasegawa-Johnson},
  title = {Preliminary Technical Validation of LittleBeats™: A Multimodal Sensing Platform to Capture Cardiac Physiology, Motion, and Vocalizations},
  journal = {Sensors},
  volume = {24},
  number = {3},
  year = {2024},
  month = jan,
  doi = {10.3390/s24030901},
  url = {https://www.mdpi.com/1424-8220/24/3/901}
}
 
@inproceedings{wang2024unsupervised,
  author = {Liming Wang and Mark Hasegawa-Johnson and Chang Yoo},
  title = {Unsupervised Speech Recognition with N-Skipgram and Positional Unigram Matching},
  booktitle = icassp,
  number = {4604},
  year = {2024},
  doi = {10.1109/ICASSP48485.2024.10446327}
}

@inproceedings{gao2024g2pu,
  author = {Heting Gao and Mark Hasegawa-Johnson and Chang D. Yoo},
  title = {G2PU: Grapheme-to-Phoneme Transducer with Speech Units},
  booktitle = icassp,
  number = {1746},
  year = {2024},
  doi = {10.1109/ICASSP48485.2024.10448105}
}

@article{mcelwain2024evaluating,
  author = {Nancy McElwain and Bashima Islam and Meghan Fisher and Camille Nebeker and Jordan Marie Bodway and Mark Hasegawa-Johnson},
  title = {Evaluating Users' Experiences of a Child Multimodal Wearable Device: A Mixed Methods Approach},
  journal = {JMIR Human Factors},
  volume = {11},
  pages = {e49316},
  year = {2024},
  publisher = {JMIR Publications},
  address = {Toronto, Canada},
  doi = {10.2196/49316}
}

@inproceedings{li2023towards,
  author = {Jialu Li and Mark Hasegawa-Johnson and Nancy McElwain},
  title = {Towards Robust Family-Infant Audio Analysis Based on Unsupervised Pretraining of Wav2vec 2.0 on Large-Scale Unlabeled Family Audio},
  booktitle = interspeech,
  year = {2023},
  doi = {10.21437/Interspeech.2023-460},
  url = {https://arxiv.org/abs/2305.12530},
  keywords = {analysis}
}

@inproceedings{qian2022contentvec,
  author = {Kaizhi Qian and Yang Zhang and Heting Gao and Junrui Ni and C.-I. Lai and David Cox and Mark Hasegawa-Johnson and Shiyu Chang},
  title = {{ContentVec}: An improved self-supervised speech representation by disentangling speakers},
  booktitle = icml,
  pages = {18003--18017},
  year = {2022},
  url = {https://proceedings.mlr.press/v162/qian22b/qian22b.pdf}
}

@inproceedings{kang2022forget,
  author = {Haeyong Kang and Rusty John Lloyd Mina and Sultan Rizky Hikmawan Madjid and Jaehong Yoon and Mark Hasegawa-Johnson and Sung Ju Hwang and Chang D Yoo},
  title = {Forget-free continual learning with winning subnetworks},
  booktitle = icml,
  volume = {162},
  pages = {10734--10750},
  year = {2022},
  month = jun,
  url = {https://proceedings.mlr.press/v162/kang22b.html}
}

@article{li2021analysis,
  author = {Jialu Li and Mark Hasegawa-Johnson and Nancy McElwain},
  title = {Analysis of Acoustic and Voice Quality Features for the Classification of Infant and Mother Vocalizations},
  journal = jsc,
  volume = {133},
  pages = {41--61},
  year = {2021},
  doi = {10.1016/j.specom.2021.07.010},
  keywords = {analysis}
}

@inproceedings{xu2018infant,
  author = {Yijia Xu and Mark Hasegawa-Johnson and Nancy L. McElwain},
  title = {Infant emotional outbursts detection in infant-parent spoken interactions},
  booktitle = interspeech,
  pages = {242--246},
  year = {2018},
  doi = {10.21437/Interspeech.2018-2429},
  keywords = {analysis}
}

@inproceedings{he2017using,
  author = {Di He and Zuofu Cheng and Mark Hasegawa-Johnson and Deming Chen},
  title = {Using Approximated Auditory Roughness as a Pre-filtering Feature for Human Screaming and Affective Speech AED},
  booktitle = interspeech,
  pages = {1914--1918},
  year = {2017},
  doi = {10.21437/Interspeech.2017-593},
  keywords = {analysis}
}

@phdthesis{pietrowicz2017exposing,
  author = {Mary Pietrowicz},
  title = {Exposing the Hidden Vocal Channel: Analysis of Vocal Expression},
  school = {University of Illinois},
  year = {2017},
  url = {https://www.ideals.illinois.edu/items/105321},
  keywords = {analysis}
}

@inproceedings{pietrowicz2017discovering,
  author = {Mary Pietrowicz and Mark Hasegawa-Johnson and Karrie Karahalios},
  title = {Discovering Dimensions of Perceived Vocal Expression in Semi-Structured, Unscripted Oral History Accounts},
  booktitle = icassp,
  pages = {2901:1--4},
  year = {2017},
  doi = {10.1109/ICASSP.2017.7953247},
  keywords = {analysis}
}

@inproceedings{pietrowicz2015acoustic,
  author = {Mary Pietrowicz and Mark Hasegawa-Johnson and Karrie Karahalios},
  title = {Acoustic Correlates for Perceived Effort Levels in Expressive Speech},
  booktitle = interspeech,
  pages = {3720--3724},
  year = {2015},
  doi = {10.21437/Interspeech.2015-738},
  keywords = {analysis}
}

@article{mathur2012detecting,
  author = {Shobhit Mathur and Marshall Scott Poole and Feniosky Pena-Mora and Mark Hasegawa-Johnson and Noshir Contractor},
  title = {Detecting interaction links in a collaborating group using manually annotated data},
  journal = {Social Networks},
  year = {2012},
  doi = {10.1016/j.socnet.2012.04.002},
  grant = {NSF 0941268},
  keywords = {analysis}
}

@inproceedings{tang2009emotion,
  author = {Hao Tang and Stephen M. Chu and Mark Hasegawa-Johnson and Thomas S. Huang},
  title = {Emotion Recognition from Speech via Boosted Gaussian Mixture Models},
  booktitle = {International Conference on Multimedia \& Expo (ICME'09)},
  pages = {294--297},
  year = {2009},
  doi = {10.1109/ICME.2009.5202493},
  grant = {NIH R21 DC008090 A},
  keywords = {analysis}
}

@article{zhang2006cognitive,
  author = {Tong Zhang and Mark Hasegawa-Johnson and Stephen E. Levinson},
  title = {Cognitive State Classification in a spoken tutorial dialogue system},
  journal = jsc,
  volume = {48},
  number = {6},
  pages = {616--632},
  year = {2006},
  doi = {10.1016/j.specom.2005.09.006},
  grant = {NSF 0085980},
  keywords = {analysis}
}

% Same paper as hasegawajohnson2004automatic; both keys are kept so existing citations resolve.
@inproceedings{hasegawajohnson04automatic,
  author = {Mark Hasegawa-Johnson and Stephen Levinson and Tong Zhang},
  title = {Automatic detection of contrast for speech understanding},
  booktitle = interspeech,
  pages = {581--584},
  year = {2004},
  doi = {10.21437/Interspeech.2004-223},
  keywords = {analysis}
}

@inproceedings{zhang2003an,
  author = {Tong Zhang and Mark Hasegawa-Johnson and Stephen E. Levinson},
  title = {An empathic-tutoring system using spoken language},
  booktitle = {Australian conference on computer-human interaction (OZCHI)},
  pages = {498--501},
  year = {2003},
  url = {https://www.researchgate.net/profile/Stephen-Levinson-2/publication/228805591_An_Empathic-tutoring_System_Using_Spoken_Language/links/54d389ac0cf2b0c6146dabde/An-Empathic-tutoring-System-Using-Spoken-Language.pdf},
  grant = {NSF 0085980},
  keywords = {analysis}
}

@inproceedings{zhang000013mental,
  author = {Tong Zhang and Mark Hasegawa-Johnson and Stephen E. Levinson},
  title = {Mental State Detection of Dialogue System Users via Spoken Language},
  booktitle = {ISCA/IEEE Workshop on Spontaneous Speech Processing and Recognition (SSPR)},
  pages = {MAP17.1--4},
  year = {2003},
  month = apr,
  url = {https://www.isca-speech.org/archive/sspr_2003/zhang03_sspr.html},
  grant = {NSF 0085980},
  keywords = {analysis}
}

@inproceedings{zhai2023wav2tobi,
  author = {Wanyue Zhai and Mark Hasegawa-Johnson},
  title = {{Wav2ToBI}: a new approach to automatic {ToBI} transcription},
  booktitle = interspeech,
  year = {2023},
  doi = {10.21437/Interspeech.2023-477},
  keywords = {analysis}
}

@incollection{rosenberg2021oxford,
  author = {Andrew Rosenberg and Mark Hasegawa-Johnson},
  title = {Automatic Prosody Labeling and Assessment},
  editor = {Carlos Gussenhoven and Aoju Chen},
  booktitle = {Oxford Handbook of Language Prosody},
  publisher = {Oxford University Press},
  pages = {646--656},
  year = {2021},
  doi = {10.1093/oxfordhb/9780198832232.013.43},
  keywords = {analysis}
}

@inproceedings{mahrt2011feature,
  author = {Tim Mahrt and Jui-Ting Huang and Yoonsook Mo and Jennifer Cole and Mark Hasegawa-Johnson and Margaret Fleck},
  title = {Feature Sets for the Automatic Detection of Prosodic Prominence},
  booktitle = {New Tools and Methods for Very Large Scale Phonetics Research},
  publisher = {University of Pennsylvania},
  year = {2011},
  month = jan,
  keywords = {analysis}
}

@inproceedings{huang2008unsupervised,
  author = {Jui-Ting Huang and Mark Hasegawa-Johnson},
  title = {Unsupervised Prosodic Break Detection in Mandarin Speech},
  booktitle = {SpeechProsody},
  pages = {165--168},
  year = {2008},
  url = {https://www.isca-speech.org/archive/speechprosody_2008/huang08_speechprosody.html},
  grant = {NSF 0534133},
  keywords = {analysis}
}

@inproceedings{zhuang2008towards,
  author = {Xiaodan Zhuang and Mark Hasegawa-Johnson},
  title = {Towards Interpretation of Creakiness in Switchboard},
  booktitle = {SpeechProsody},
  pages = {37--40},
  year = {2008},
  url = {https://www.isca-speech.org/archive/speechprosody_2008/zhuang08_speechprosody.html},
  grant = {NSF 0414117},
  keywords = {analysis}
}

% NOTE(review): appears to describe the same paper as yoon2008detecting (same title, year and
% archive item) but with a different author list; confirm which list is correct.
@inproceedings{yoon000019detecting,
  author = {Taejin Yoon and Jennifer Cole and Mark Hasegawa-Johnson},
  title = {Detecting Non-Modal Phonation in Telephone Speech},
  booktitle = {SpeechProsody},
  pages = {33--36},
  year = {2008},
  url = {https://www.isca-speech.org/archive/speechprosody_2008/yoon08_speechprosody.html},
  grant = {NSF 0414117},
  keywords = {analysis}
}

@phdthesis{yoon2007a,
  author = {Taejin Yoon},
  title = {A Predictive Model of Prosody Through Grammatical Interface: A Computational Approach},
  school = {University of Illinois},
  year = {2007},
  url = {https://www.ideals.illinois.edu/items/83925},
  keywords = {analysis}
}

@article{zhang2007extraction,
  author = {Tong Zhang and Mark Hasegawa-Johnson and Stephen E. Levinson},
  title = {Extraction of Pragmatic and Semantic Salience from Spontaneous Spoken English},
  journal = jsc,
  year = {2007},
  doi = {10.1016/j.specom.2005.07.007},
  grant = {NSF 0085980},
  keywords = {analysis}
}

@inproceedings{reddy2006mclc,
  author = {Rajiv Reddy and Mark Hasegawa-Johnson},
  title = {Analysis of Pitch Contours in Repetition-Disfluency using Stem-ML},
  booktitle = {Midwest Computational Linguistics Colloquium},
  year = {2006},
  url = {https://www.researchgate.net/profile/Rajiv-Reddy-7/publication/228967280_Analysis_of_Pitch_Contours_in_Repetition-Disfluency_using_Stem-ML/links/00b49536b0b12a63e2000000/Analysis-of-Pitch-Contours-in-Repetition-Disfluency-using-Stem-ML.pdf},
  keywords = {analysis}
}

% The original author field read "Cole and Jennifer", which BibTeX parses as two separate
% authors; it is one person, Jennifer Cole (spelled that way in yoon000019detecting).
@inproceedings{yoon2008detecting,
  author = {Tae-Jin Yoon and Jennifer Cole and Mark Hasegawa-Johnson and Chilin Shih},
  title = {Detecting Non-modal Phonation in Telephone Speech},
  booktitle = {Proc. Speech Prosody},
  year = {2008},
  url = {https://www.isca-archive.org/speechprosody_2008/yoon08_speechprosody.pdf},
  grant = {NSF 0414117},
  keywords = {analysis}
}

% The original author field read "Cole and Jennifer", which BibTeX parses as two separate
% authors; it is one person, Jennifer Cole.
@article{yoon2005acoustic,
  author = {Tae-Jin Yoon and Jennifer Cole and Mark Hasegawa-Johnson and Chilin Shih},
  title = {Acoustic correlates of non-modal phonation in telephone speech},
  journal = {The Journal of the Acoustical Society of America},
  volume = {117},
  number = {4},
  pages = {2621},
  year = {2005},
  doi = {10.1121/1.4778287},
  grant = {NSF 0414117},
  keywords = {analysis}
}

% Same paper as hasegawajohnson04automatic; both keys are kept so existing citations resolve.
@inproceedings{hasegawajohnson2004automatic,
  author = {Mark Hasegawa-Johnson and Stephen Levinson and Tong Zhang},
  title = {Automatic detection of contrast for speech understanding},
  booktitle = interspeech,
  pages = {581--584},
  year = {2004},
  doi = {10.21437/Interspeech.2004-223},
  grant = {NSF 0085980}
}

@inproceedings{borys000029modeling,
  author = {Sarah Borys and Mark Hasegawa-Johnson and Ken Chen and Aaron Cohen},
  title = {Modeling and Recognition of Phonetic and Prosodic Factors for Improvements to Acoustic Speech Recognition Models},
  booktitle = interspeech,
  pages = {3013--3016},
  year = {2004},
  month = oct,
  doi = {10.21437/Interspeech.2004-756},
  grant = {NSF 0132900},
  keywords = {analysis}
}

@inproceedings{chen2004maximum,
  author = {Ken Chen and Mark Hasegawa-Johnson and Aaron Cohen and Jennifer Cole},
  title = {A Maximum Likelihood Prosody Recognizer},
  booktitle = {SpeechProsody},
  address = {Nara, Japan},
  pages = {509--512},
  year = {2004},
  month = mar,
  url = {https://www.isca-speech.org/archive/speechprosody_2004/chen04b_speechprosody.html},
  grant = {NSF 0132900},
  keywords = {analysis}
}

@inproceedings{chen2004an,
  author = {Ken Chen and Mark Hasegawa-Johnson},
  title = {An Automatic Prosody Labeling System Using ANN-Based Syntactic-Prosodic Model and GMM-Based Acoustic-Prosodic Model},
  booktitle = icassp,
  year = {2004},
  doi = {10.1109/ICASSP.2004.1326034},
  grant = {NSF 0132900},
  keywords = {analysis}
}

@article{kim2004automatic,
  author = {Sung-Suk Kim and Mark Hasegawa-Johnson and Ken Chen},
  title = {Automatic Recognition of Pitch Movements Using Multilayer Perceptron and Time-Delay Recursive Neural Network},
  journal = {IEEE Signal Processing Letters},
  volume = {11},
  number = {7},
  pages = {645--648},
  year = {2004},
  doi = {10.1109/LSP.2004.830114},
  grant = {NSF 0132900},
  keywords = {analysis}
}

@inproceedings{ren2004speaker,
  author = {Yuexi Ren and Sung-Suk Kim and Mark Hasegawa-Johnson and Jennifer Cole},
  title = {Speaker-Independent Automatic Detection of Pitch Accent},
  booktitle = {Proc. Speech Prosody 2004},
  address = {Nara, Japan},
  pages = {521--524},
  year = {2004},
  month = mar,
  url = {https://www.isca-speech.org/archive/speechprosody_2004/ren04_speechprosody.html},
  grant = {NSF 0085980},
  keywords = {analysis}
}

@inproceedings{chen2003an,
  author = {Ken Chen and Mark Hasegawa-Johnson and Sung-Suk Kim},
  title = {An Intonational Phrase Boundary and Pitch Accent Dependent Speech Recognizer},
  booktitle = {International Conference on Systems, Cybernetics, and Intelligence},
  year = {2003},
  url = {https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=e9e5670e89cc257c290bc5787bb0c46ffc6061fa},
  keywords = {analysis}
}

@inproceedings{chen2003improving,
  author = {Ken Chen and Mark Hasegawa-Johnson},
  title = {Improving the robustness of prosody dependent language modeling based on prosody syntax cross-correlation},
  booktitle = {ASRU},
  year = {2003},
  doi = {10.1109/ASRU.2003.1318480},
  keywords = {analysis}
}

@inproceedings{zhu2021a,
  author = {Junzhe Zhu and Mark Hasegawa-Johnson and Nancy McElwain},
  title = {A Comparison Study on Infant-Parent Voice Diarization},
  booktitle = icassp,
  pages = {7178--7182},
  year = {2021},
  doi = {10.1109/ICASSP39728.2021.9413538},
  keywords = {analysis}
}

@inproceedings{zhu2020identify,
  author = {Junzhe Zhu and Mark Hasegawa-Johnson and Leda Sari},
  title = {Identify Speakers in Cocktail Parties with End-to-End Attention},
  booktitle = interspeech,
  pages = {3092--3096},
  year = {2020},
  doi = {10.21437/Interspeech.2020-2430},
  url = {https://arxiv.org/pdf/2005.11408.pdf},
  keywords = {analysis}
}

@inproceedings{sari2019pre-training,
  author = {Leda Sari and Samuel Thomas and Mark Hasegawa-Johnson and Michael Picheny},
  title = {Pre-Training of Speaker Embeddings for Low-Latency Speaker Change Detection in Broadcast News},
  booktitle = icassp,
  pages = {3093:1--5},
  year = {2019},
  doi = {10.1109/ICASSP.2019.8683612},
  keywords = {analysis}
}

@unpublished{qian2014regularized,
  author = {Kaizhi Qian},
  title = {Regularized Estimation of Gaussian Mixture Models for SVM Based Speaker Recognition},
  year = {2014},
  url = {https://www.ideals.illinois.edu/items/55611},
  note = {B.S. Thesis, University of Illinois},
  keywords = {analysis}
}

@article{tang2012partially,
  author = {Hao Tang and Stephen Chu and Mark Hasegawa-Johnson and Thomas Huang},
  title = {Partially Supervised Speaker Clustering},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  volume = {34},
  number = {5},
  pages = {959--971},
  year = {2012},
  doi = {10.1109/TPAMI.2011.174},
  keywords = {analysis}
}

@inproceedings{harwath2010phonetic,
  author = {David Harwath and Mark Hasegawa-Johnson},
  title = {Phonetic Landmark Detection for Automatic Language Identification},
  booktitle = {Speech Prosody},
  pages = {100231:1--4},
  year = {2010},
  url = {https://www.isca-speech.org/archive/speechprosody_2010/harwath10_speechprosody.html},
  grant = {NSF 0703624},
  keywords = {analysis}
}

@inproceedings{zhou2007robust,
  author = {Xi Zhou and Yu Fun and Ming Liu and Mark Hasegawa-Johnson and Thomas Huang},
  title = {Robust Analysis and Weighting on MFCC Components for Speech Recognition and Speaker Identification},
  booktitle = {International Conference on Multimedia and Expo},
  pages = {188--191},
  year = {2007},
  doi = {10.1109/ICME.2007.4284618},
  grant = {NSF 0426627},
  keywords = {analysis}
}

@inproceedings{liu2007exploring,
  author = {Ming Liu and Zhengyou Zhang and Mark Hasegawa-Johnson and Thomas Huang},
  title = {Exploring Discriminative Learning for Text-Independent Speaker Recognition},
  booktitle = {ICME},
  pages = {56--59},
  year = {2007},
  doi = {10.1109/ICME.2007.4284585},
  grant = {NSF 0426627},
  keywords = {analysis}
}

@inproceedings{hasegawa-johnson2009visual,
  author = {Mark Hasegawa-Johnson and Camille Goudeseune and Kai-Hsiang Lin and David Cohen and Xi Zhou and Xiaodan Zhuang and Kyungtae Kim and Hank Kaczmarski and Thomas Huang},
  title = {Visual Analytics for Audio},
  booktitle = {NIPS Workshop on Visual Analytics},
  year = {2009},
  grant = {NSF 0807329},
  keywords = {analysis}
}

@unpublished{hasegawa-johnson2009pattern,
  author = {Mark Hasegawa-Johnson},
  title = {Pattern Recognition in Acoustic Signal Processing},
  year = {2009},
  note = {Unpublished presentation at the Machine Learning Summer School, University of Chicago},
  grant = {NSF 0807329},
  keywords = {analysis}
}

@article{hasegawa-johnson2009tutorial,
  author = {Mark Hasegawa-Johnson},
  title = {Tutorial: Pattern Recognition in Signal Processing},
  journal = jasa,
  volume = {125},
  pages = {2698},
  year = {2009},
  doi = {10.1121/1.4784323},
  grant = {NSF 0803219},
  keywords = {analysis}
}

@inproceedings{sakr2012topic,
  author = {Ali Sakr and Mark Hasegawa-Johnson},
  title = {Topic Modeling of Phonetic Latin-Spelled Arabic for the Relative Analysis of Genre-Dependent and Dialect-Dependent Variation},
  booktitle = {CITALA},
  pages = {153--158},
  year = {2012},
  isbn = {978-9954-9135-0-5},
  url = {https://www.academia.edu/download/86879040/06fr-rist20-2.pdf},
  grant = {QNRF NPRP 410-1-069},
  keywords = {analysis}
}

@unpublished{al-sabbagh2011using,
  author = {Rania Al-Sabbagh and Roxana Girju and Mark Hasegawa-Johnson and Elabbas Benmamoun and Rehab Duwairi and Eiman Mustafawi},
  title = {Using Web Mining Techniques to Build a Multi-Dialect Lexicon of Arabic},
  year = {2011},
  note = {Talk delivered at the Linguistics in the Gulf Conference},
  keywords = {analysis}
}

@inproceedings{zhang2015multichannel,
  author = {Yang Zhang and Nasser Nasrabadi and Mark Hasegawa-Johnson},
  title = {Multichannel Transient Acoustic Signal Classification Using Task-Driven Dictionary with Joint Sparsity and Beamforming},
  booktitle = icassp,
  pages = {2591:1--5},
  year = {2015},
  doi = {10.1109/ICASSP.2015.7178294},
  grant = {ARO W911NF-09-1-0383},
  keywords = {analysis}
}

% The DOI prefix 10.1109/TASLP identifies the IEEE/ACM Transactions on Audio, Speech, and
% Language Processing; the journal field previously named a different title.
@article{chen2013mixed,
  author = {Austin Chen and Mark Hasegawa-Johnson},
  title = {Mixed Stereo Audio Classification Using a Stereo-Input Mixed-to-Panned Level Feature},
  journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
  volume = {22},
  number = {12},
  pages = {2025--2033},
  year = {2014},
  doi = {10.1109/TASLP.2014.2359628},
  grant = {QNRF NPRP 09-410-1-069},
  keywords = {analysis}
}

@misc{hasegawa-johnson2014probabilistic,
  author = {Mark Hasegawa-Johnson},
  title = {Probabilistic Segmental Model For Doppler Ultrasound Heart Rate Monitoring},
  howpublished = {United States Patent Number 8727991},
  year = {2014},
  month = may,
  url = {http://www.google.com/patents/US8727991},
  keywords = {analysis}
}

% NOTE(review): the DOI suffix (jmdem.2012070101) suggests a July 2012 issue while year/month
% say April 2013; left as given -- confirm against the publisher record.
@article{mertens2013on,
  author = {Robert Mertens and Po-Sen Huang and Luke Gottlieb and Gerald Friedland and Ajay Divakaran and Mark Hasegawa-Johnson},
  title = {On the Application of Speaker Diarization to Audio Indexing of Non-Speech and Mixed Non-Speech/Speech Video Soundtracks},
  journal = {International Journal of Multimedia Data Engineering and Management (IJMDEM)},
  volume = {3},
  number = {3},
  pages = {1--19},
  year = {2013},
  month = apr,
  doi = {10.4018/jmdem.2012070101},
  keywords = {analysis}
}

@inproceedings{huang2012opportunistic,
  author = {Po-Sen Huang and Mark Hasegawa-Johnson and Wotao Yin and Tom Huang},
  title = {Opportunistic Sensing: Unattended Acoustic Sensor Selection Using Crowdsourcing Models},
  booktitle = {IEEE Workshop on Machine Learning in Signal Processing},
  year = {2012},
  doi = {10.1109/MLSP.2012.6349815},
  keywords = {analysis}
}

@inproceedings{huang2012pooling,
  author = {Po-Sen Huang and Jianchao Yang and Mark Hasegawa-Johnson and Feng Liang and Thomas S. Huang},
  title = {Pooling Robust Shift-Invariant Sparse Representations of Acoustic Signals},
  booktitle = interspeech,
  pages = {2518--2521},
  year = {2012},
  doi = {10.21437/Interspeech.2012-652},
  keywords = {analysis}
}

@unpublished{hasegawa-johnson2012toward,
  author = {Mark Hasegawa-Johnson and Xiaodan Zhuang and Xi Zhou and Camille Goudeseune and Hao Tang and Kai-Hsiang Lin and Mohamed Omar and Thomas Huang},
  title = {Toward Better Real-world Acoustic Event Detection},
  year = {2012},
  month = may,
  note = {Unpublished presentation given at Seoul National University},
  keywords = {analysis}
}

@inproceedings{huang2012how,
  author = {Po-Sen Huang and Robert Mertens and Ajay Divakaran and Gerald Friedland and Mark Hasegawa-Johnson},
  title = {How to Put it into Words---Using Random Forests to Extract Symbol Level Descriptions from Audio Content for Concept Detection},
  booktitle = icassp,
  year = {2012},
  doi = {10.1109/ICASSP.2012.6287927},
  grant = {ARO W911NF-09-1-0383},
  keywords = {analysis}
}


@inproceedings{mertens2011on,
  author = {R. Mertens and P.-S. Huang and L. Gottlieb and G. Friedland and A. Divakaran},
  title = {On the Application of Speaker Diarization to Audio Concept Detection for Multimedia Retrieval},
  booktitle = {IEEE International Symposium on Multimedia},
  pages = {446--451},
  year = {2011},
  doi = {10.1109/ISM.2011.79},
  keywords = {analysis}
}

@inproceedings{huang2011exemplar,
  author = {Po-Sen Huang and Mark Hasegawa-Johnson and Thyagaraju Damarla},
  title = {Exemplar Selection Methods to Distinguish Human from Animal Footsteps},
  booktitle = {Second Annual Human and Light Vehicle Detection Workshop},
  address = {Maryland},
  pages = {14:1--10},
  year = {2011},
  url = {https://posenhuang.github.io/papers/Exemplar_Selection_HLVD2011.pdf},
  grant = {ARO W911NF-09-1-0383},
  keywords = {analysis}
}

% The url previously carried a casa_token query parameter (a per-session access token);
% it is removed so that only the stable document address is stored.
@inproceedings{huang2011multi-sensory,
  author = {Po-Sen Huang and Thyagaraju Damarla and Mark Hasegawa-Johnson},
  title = {Multi-sensory features for Personnel Detection at Border Crossings},
  booktitle = {Fusion},
  year = {2011},
  url = {https://ieeexplore.ieee.org/abstract/document/5977673},
  grant = {ARO W911NF-09-1-0383},
  keywords = {analysis}
}

@phdthesis{zhuang2011modeling,
  author = {Xiaodan Zhuang},
  title = {Modeling Audio and Visual Cues for Real-world Event Detection},
  school = {University of Illinois},
  year = {2011},
  month = apr,
  url = {https://www.ideals.illinois.edu/items/24703},
  keywords = {analysis}
}

@inproceedings{huang2011improving,
  author = {Po-Sen Huang and Xiaodan Zhuang and Mark Hasegawa-Johnson},
  title = {Improving Acoustic Event Detection using Generalizable Visual Features and Multi-modality Modeling},
  booktitle = icassp,
  pages = {349--352},
  year = {2011},
  doi = {10.1109/ICASSP.2011.5946412},
  grant = {ARO W911NF-09-1-0383},
  keywords = {analysis}
}

% NOTE(review): issue number changed from 2 to 12 to agree with the September date and the
% page range 1543--1551; confirm against the publisher record.
@article{zhuang2010real-world,
  author = {Xiaodan Zhuang and Xi Zhou and Mark A. Hasegawa-Johnson and Thomas S. Huang},
  title = {Real-world Acoustic Event Detection},
  journal = {Pattern Recognition Letters},
  volume = {31},
  number = {12},
  pages = {1543--1551},
  year = {2010},
  month = sep,
  doi = {10.1016/j.patrec.2010.02.005},
  grant = {NSF 0807329},
  keywords = {analysis}
}

@article{hasegawa-johnson2009adaptation,
  author = {Mark Hasegawa-Johnson and Xiaodan Zhuang and Xi Zhou and Camille Goudeseune and Thomas S. Huang},
  title = {Adaptation of tandem {HMMs} for non-speech audio event detection},
  doi = {10.1121/1.4784503},
  journal = jasa,
  volume = {125},
  number = {4},
  pages = {2730},
  year = {2009},
  keywords = {analysis}
}

@inproceedings{zhuang2009acoustic,
  author = {Xiaodan Zhuang and Jing Huang and Gerasimos Potamianos and Mark Hasegawa-Johnson},
  title = {Acoustic Fall Detection using {Gaussian} Mixture Models and {GMM} Supervectors},
  doi = {10.1109/ICASSP.2009.4959522},
  booktitle = icassp,
  year = {2009},
  pages = {69--72},
  keywords = {analysis}
}

@inproceedings{zhuang000070feature,
  author = {Xiaodan Zhuang and Xi Zhou and Thomas S. Huang and Mark Hasegawa-Johnson},
  title = {Feature Analysis and Selection for Acoustic Event Detection},
  doi = {10.1109/ICASSP.2008.4517535},
  booktitle = icassp,
  pages = {17--20},
  year = {2008},
  grant = {NSF 0414117},
  keywords = {analysis}
}

@article{zhou000071hmm-based,
  author = {Xi Zhou and Xiaodan Zhuang and Ming Liu and Hao Tang and Mark Hasegawa-Johnson and Thomas Huang},
  title = {{HMM}-Based Acoustic Event Detection with {AdaBoost} Feature Selection},
  doi = {10.1007/978-3-540-68585-2_33},
  journal = {Lecture Notes in Computer Science},
  year = {2008},
  volume = {4625},
  pages = {345--353},
  grant = {NSF 0414117},
  keywords = {analysis}
}

@inproceedings{yang2016landmarkbased,
  author = {Xuesong Yang and Xiang Kong and Mark Hasegawa-Johnson and Yanlu Xie},
  title = {Landmark-based Pronunciation Error Identification on {L2 Mandarin Chinese}},
  booktitle = {Speech Prosody},
  year = {2016},
  pages = {247--251},
  doi = {10.21437/SpeechProsody.2016-51},
  keywords = {analysis}
}

@inproceedings{bhat2010interspeech,
  author = {Suma Bhat and Mark Hasegawa-Johnson and Richard Sproat},
  title = {Automatic Fluency Assessment by Signal-Level Measurement of Spontaneous Speech},
  booktitle = {INTERSPEECH Satellite Workshop on Second Language Studies: Acquisition, Learning, Education and Technology},
  year = {2010},
  url = {https://www.isca-speech.org/archive/l2ws_2010/bhat10_l2ws.html},
  keywords = {analysis}
}

@inproceedings{yoon2010landmark-based,
  author = {Su-Youn Yoon and Mark Hasegawa-Johnson and Richard Sproat},
  title = {Landmark-based Automated Pronunciation Error Detection},
  booktitle = interspeech,
  year = {2010},
  pages = {614--617},
  doi = {10.21437/Interspeech.2010-236},
  keywords = {analysis}
}

@inproceedings{bhat2010language,
  author = {Suma Bhat and Richard Sproat and Mark Hasegawa-Johnson and Fred Davidson},
  title = {Automatic fluency assessment using thin-slices of spontaneous speech},
  booktitle = {Language Testing Research Colloquium},
  address = {Denver, CO},
  year = {2010},
  keywords = {analysis}
}

@inproceedings{yoon2009interspeech,
  author = {Su-Youn Yoon and Mark Hasegawa-Johnson and Richard Sproat},
  title = {Automated Pronunciation Scoring using Confidence Scoring and Landmark-based {SVM}},
  booktitle = interspeech,
  pages = {1903--1906},
  doi = {10.21437/Interspeech.2009-551},
  address = {Brighton},
  month = sep,
  year = {2009},
  keywords = {analysis}
}

@inproceedings{yoon2009calico,
  author = {Su-Youn Yoon and Mark Hasegawa-Johnson and Richard Sproat},
  title = {Automated Pronunciation Scoring for {L2 English} Learners},
  booktitle = {CALICO workshop},
  year = {2009},
  keywords = {analysis}
}

@inproceedings{zhang2004children,
  author = {Tong Zhang and Mark Hasegawa-Johnson and Stephen E. Levinson},
  title = {Children's Emotion Recognition in an Intelligent Tutoring Scenario},
  booktitle = interspeech,
  month = oct,
  year = {2004},
  grant = {NSF 0085980},
  pages = {1441--1444},
  doi = {10.21437/Interspeech.2004-552},
  keywords = {analysis}
}

@inproceedings{harvill22_interspeech,
  author = {John Harvill and Mark Hasegawa-Johnson and Chang D. Yoo},
  title = {Frame-Level Stutter Detection},
  year = {2022},
  booktitle = interspeech,
  pages = {2843--2847},
  doi = {10.21437/Interspeech.2022-204}
}

@inproceedings{harvill2022estimation,
  author = {John Harvill and Yash Wani and Narendra Ahuja and Mark Hasegawa-Johnson and David Chestek and Mustafa Alam and David Beiser},
  title = {Estimation of Respiratory Rate from Breathing Audio},
  booktitle = {44th Annual International Conference of the IEEE Engineering in Medicine and Biology Society},
  year = {2022},
  url = {https://ieeexplore.ieee.org/document/9871897},
  keywords = {analysis}
}

@inproceedings{harvill2021classification,
  author = {John Harvill and Yash R. Wani and Mark Hasegawa-Johnson and Narendra Ahuja and David Beiser and David Chestek},
  title = {Classification of {COVID-19} from Cough Using Autoregressive Predictive Coding Pretraining and Spectral Data Augmentation},
  booktitle = interspeech,
  year = {2021},
  keywords = {analysis},
  pages = {926--930},
  doi = {10.21437/Interspeech.2021-799}
}

@inproceedings{abavisani000086automatic,
  author = {Ali Abavisani and Mark Hasegawa-Johnson},
  title = {Automatic Estimation of Intelligibility Measure for Consonants in Speech},
  url = {https://arxiv.org/abs/2005.06065},
  booktitle = interspeech,
  year = {2020},
  keywords = {analysis},
  pages = {1161--1165},
  doi = {10.21437/Interspeech.2020-2121}
}

@article{rong2012relationship,
  author = {Panying Rong and Torrey Loucks and Heejin Kim and Mark Hasegawa-Johnson},
  title = {Relationship between kinematics, {F2} slope and speech intelligibility in dysarthria due to cerebral palsy},
  journal = {Clinical Linguistics \& Phonetics},
  month = sep,
  year = {2012},
  volume = {26},
  number = {9},
  pages = {806--822},
  doi = {10.3109/02699206.2012.706686},
  keywords = {analysis}
}

@article{kim2011temporal,
  author = {Heejin Kim and Mark Hasegawa-Johnson and Adrienne Perlman},
  title = {Temporal and spectral characteristics of fricatives in dysarthria},
  journal = jasa,
  volume = {130},
  pages = {2446},
  doi = {10.1121/1.3654821},
  year = {2011},
  keywords = {analysis}
}

@article{kim2011vowel,
  author = {Heejin Kim and Mark Hasegawa-Johnson and Adrienne Perlman},
  title = {Vowel Contrast and Speech Intelligibility in Dysarthria},
  doi = {10.1159/000318881},
  journal = {Folia Phoniatrica et Logopaedica},
  volume = {63},
  number = {4},
  pages = {187--194},
  year = {2011},
  grant = {NIH DC0032301},
  keywords = {analysis}
}

@article{kim2010frequency,
  author = {Heejin Kim and Katie Martin and Mark Hasegawa-Johnson and Adrienne Perlman},
  title = {Frequency of consonant articulation errors in dysarthric speech},
  doi = {10.3109/02699206.2010.497238},
  url = {https://www.tandfonline.com/doi/pdf/10.3109/02699206.2010.497238},
  journal = {Clinical Linguistics \& Phonetics},
  volume = {24},
  number = {10},
  pages = {759--770},
  year = {2010},
  grant = {NIH DC0032301},
  keywords = {analysis}
}

@inproceedings{kim2010acoustic,
  author = {Heejin Kim and Mark Hasegawa-Johnson and Adrienne Perlman},
  title = {Acoustic Cues to Lexical Stress in Spastic Dysarthria},
  booktitle = {Speech Prosody},
  url = {https://www.isca-speech.org/archive/speechprosody_2010/kim10_speechprosody.html},
  year = {2010},
  pages = {100891:1--4},
  grant = {NIH R21-DC008090-A},
  keywords = {analysis}
}

@inproceedings{kim2010kinematic,
  author = {Heejin Kim and Panying Rong and Torrey M. Loucks and Mark Hasegawa-Johnson},
  title = {Kinematic Analysis of Tongue Movement Control in Spastic Dysarthria},
  booktitle = interspeech,
  year = {2010},
  pages = {2578--2581},
  doi = {10.21437/Interspeech.2010-697},
  grant = {NSF 0534106},
  keywords = {analysis}
}

@article{lin2013saliency-maximized,
  author = {Kai-Hsiang Lin and Xiaodan Zhuang and Camille Goudeseune and Sarah King and Mark Hasegawa-Johnson and Thomas S. Huang},
  title = {Saliency-Maximized Audio Visualization and Efficient Audio-Visual Browsing for Faster-than-Real-Time Human Acoustic Event Detection},
  journal = {ACM Transactions on Applied Perception},
  year = {2013},
  doi = {10.1145/2536764.2536773},
  grant = {NSF 0807329},
  keywords = {analysis}
}

@inproceedings{goudeseune2012effective,
  author = {Camille Goudeseune},
  title = {Effective browsing of long audio recordings},
  booktitle = {ACM International Workshop on Interactive Multimedia on Mobile and Portable Devices},
  year = {2012},
  doi = {10.1145/2390821.2390831},
  grant = {NSF 0807329},
  software = {https://github.com/camilleg/timeliner/blob/master/README.md},
  keywords = {analysis}
}

@inproceedings{lin2012improving,
  author = {Kai-Hsiang Lin and Xiaodan Zhuang and Camille Goudeseune and Sarah King and Mark Hasegawa-Johnson and Thomas Huang},
  title = {Improving Faster-than-Real-Time Human Acoustic Event Detection by Saliency-Maximized Audio Visualization},
  doi = {10.1109/ICASSP.2012.6288368},
  booktitle = icassp,
  year = {2012},
  pages = {2277--2280},
  grant = {NSF 0807329},
  keywords = {analysis}
}

@unpublished{cohen2009efficient,
  author = {David Cohen and Camille Goudeseune and Mark Hasegawa-Johnson},
  year = {2009},
  title = {Efficient Simultaneous Multi-Scale Computation of {FFTs}},
  note = {Georgia Tech publication GT-FODAVA-09-01},
  software = {https://github.com/camilleg/multiscale-FFT},
  keywords = {analysis}
}

@unpublished{petruncio2002evaluation,
  author = {David Petruncio},
  title = {Evaluation of Various Features for Music Genre Classification with Hidden {Markov} Models},
  note = {B.S. Thesis, University of Illinois},
  year = {2002},
  keywords = {analysis}
}

@article{beauchamp2001acoustics,
  author = {James Beauchamp and Heinrich Taube and Sever Tipei and Scott Wyatt and Lippold Haken and Mark Hasegawa-Johnson},
  title = {Acoustics, Audio, and Music Technology Education at the {University of Illinois}},
  doi = {10.1121/1.4776867},
  url = {https://asa.scitation.org/doi/abs/10.1121/1.4776867},
  journal = jasa,
  volume = {110},
  number = {5},
  pages = {2961},
  year = {2001},
  keywords = {analysis}
}

@inproceedings{hasegawa-johnson1999icppit,
  author = {Mark Hasegawa-Johnson and Jul Cha and Shamala Pizza and Katherine Haker},
  title = {{CTMRedit}: A case study in human-computer interface design},
  url = {https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=4bc8af525ca1f09e6cdc7c5399f382906d3a5365},
  booktitle = {International Conference On Public Participation and Information Technology},
  address = {Lisbon},
  pages = {575--584},
  year = {1999},
  grant = {NIH DC0032301},
  keywords = {analysis}
}

@phdthesis{serwy2017hilbert,
  author = {Roger Serwy},
  title = {{Hilbert} Phase Methods for Glottal Activity Detection},
  url = {https://www.ideals.illinois.edu/items/102357},
  school = {University of Illinois},
  year = {2017},
  keywords = {analysis}
}

@article{livescu2016speech,
  author = {Karen Livescu and Frank Rudzicz and Eric Fosler-Lussier and Mark Hasegawa-Johnson and Jeff Bilmes},
  title = {Speech Production in Speech Technologies: Introduction to the {CSL} Special Issue},
  doi = {10.1016/j.csl.2015.11.002},
  journal = {Computer Speech and Language},
  volume = {36},
  pages = {165--172},
  year = {2016},
  keywords = {analysis}
}

@inproceedings{chang2023classification,
  title = {Classification of infant sleep/wake states: cross-attention among large scale pretrained transformer networks using audio, {ECG}, and {IMU} data},
  author = {Chang, Kai Chieh and Hasegawa-Johnson, Mark and McElwain, Nancy L. and Islam, Bashima},
  booktitle = {2023 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)},
  pages = {2370--2377},
  year = {2023},
  organization = {IEEE},
  doi = {10.1109/APSIPAASC58517.2023.10317201},
  url = {https://ieeexplore.ieee.org/iel7/10317071/10317095/10317201.pdf}
}

@inproceedings{andrew000105,
  author = {Galen Andrew and Raman Arora and Sujeeth Bharadwaj and Jeff Bilmes and Mark Hasegawa-Johnson and Karen Livescu},
  title = {Using articulatory measurements to learn better acoustic features},
  booktitle = {Proc. Workshop on Speech Production in Automatic Speech Recognition},
  year = {2013},
  address = {Lyon, France},
  url = {https://www.isca-speech.org/archive/spasr_2013/andrew13_spasr.html},
  keywords = {analysis}
}

@inproceedings{juneja2013experiments,
  author = {Amit Juneja and Mark Hasegawa-Johnson},
  title = {Experiments on context-awareness and phone error propagation in human and machine speech recognition},
  booktitle = {Proc. Workshop on Speech Production in Automatic Speech Recognition},
  year = {2013},
  address = {Lyon, France},
  url = {https://www.isca-speech.org/archive/spasr_2013/juneja13_spasr.html},
  keywords = {analysis}
}

@article{nam2015a,
  author = {Hosung Nam and Vikramjit Mitra and Mark Tiede and Mark Hasegawa-Johnson and Carol Espy-Wilson and Elliot Saltzman and Louis Goldstein},
  title = {A procedure for estimating gestural scores from speech acoustics},
  journal = jasa,
  volume = {132},
  number = {6},
  year = {2012},
  doi = {10.1121/1.4763545},
  pages = {3980--3989},
  keywords = {analysis}
}

@article{hasegawa-johnson2003vowel,
  author = {Mark Hasegawa-Johnson and Shamala Pizza and Abeer Alwan and Jul Cha and Katherine Haker},
  title = {Vowel Category Dependence of the Relationship Between Palate Height, Tongue Height, and Oral Area},
  doi = {10.1044/1092-4388(2003/059)},
  journal = jslhr,
  volume = {46},
  number = {3},
  pages = {738--753},
  year = {2003},
  grant = {NIH DC0032301},
  keywords = {analysis}
}

@article{zheng2003parafac,
  author = {Yanli Zheng and Mark Hasegawa-Johnson and Shamala Pizza},
  title = {Analysis of the three-dimensional tongue shape using a three-index factor analysis model},
  doi = {10.1121/1.1520538},
  journal = jasa,
  volume = {113},
  number = {1},
  pages = {478--486},
  month = jan,
  year = {2003},
  grant = {NIH DC0032301},
  keywords = {analysis}
}

@article{hasegawa-johnson2000line,
  author = {Mark Hasegawa-Johnson},
  title = {Line Spectral Frequencies are the Poles and Zeros of a Discrete Matched-Impedance Vocal Tract Model},
  doi = {10.1121/1.429481},
  journal = jasa,
  volume = {108},
  number = {1},
  pages = {457--460},
  year = {2000},
  grant = {NIH DC0032301},
  keywords = {analysis}
}

@article{zheng2000three,
  author = {Yanli Zheng and Mark Hasegawa-Johnson},
  title = {Three Dimensional Tongue Shape Factor Analysis},
  journal = {ASHA Leader},
  volume = {5},
  number = {16},
  pages = {144},
  year = {2000},
  grant = {NIH DC0032301},
  keywords = {analysis}
}

@unpublished{hasegawa-johnson2001preliminary,
  author = {Mark Hasegawa-Johnson},
  title = {Preliminary Work and Proposed Continuation: Imaging of Speech Anatomy and Behavior},
  note = {Unpublished presentation at Universities of Illinois Inter-campus Biomedical Imaging Forum},
  year = {2001},
  grant = {NIH DC0032301},
  keywords = {analysis}
}

@inproceedings{hasegawa-johnson1999embs,
  author = {Mark Hasegawa-Johnson and Jul Cha and Katherine Haker},
  title = {{CTMRedit}: A {Matlab}-based tool for segmenting and interpolating {MRI} and {CT} images in three orthogonal planes},
  booktitle = {21st Annual International Conference of the IEEE/EMBS Society},
  pages = {1170},
  year = {1999},
  grant = {NIH DC0032301},
  keywords = {analysis}
}

@inproceedings{hasegawa-johnson1999combining,
  author = {Mark Hasegawa-Johnson},
  title = {Combining magnetic resonance image planes in the {Fourier} domain for improved spatial resolution},
  url = {https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=2444cdb69b01fcd889bfc3545f97637fbc330ac6},
  booktitle = {International Conference On Signal Processing Applications and Technology},
  address = {Orlando, FL},
  pages = {81.1--5},
  year = {1999},
  grant = {NIH DC0032301},
  keywords = {analysis}
}

@article{hasegawa-johnson1998electromagnetic,
  author = {Mark Hasegawa-Johnson},
  title = {Electromagnetic Exposure Safety of the {Carstens Articulograph AG100}},
  doi = {10.1121/1.423775},
  journal = jasa,
  volume = {104},
  pages = {2529--2532},
  year = {1998},
  grant = {NIH DC0032301},
  keywords = {analysis}
}

@article{johnson1992using,
  author = {Mark A. Johnson},
  title = {Using beam elements to model the vocal fold length in breathy voicing},
  journal = jasa,
  volume = {91},
  pages = {2420--2421},
  year = {1992},
  keywords = {analysis}
}

@article{ni2019the,
  author = {Junrui Ni and Mark Hasegawa-Johnson and Odette Scharenborg},
  title = {The Time-Course of Phoneme Category Adaptation in Deep Neural Networks},
  doi = {10.1007/978-3-030-31372-2_1},
  url = {https://www.researchgate.net/profile/Odette_Scharenborg/publication/336096664_The_Time-Course_of_Phoneme_Category_Adaptation_in_Deep_Neural_Networks/links/5db0627e4585155e27f81326/The-Time-Course-of-Phoneme-Category-Adaptation-in-Deep-Neural-Networks.pdf},
  journal = {Lecture Notes in Artificial Intelligence},
  volume = {11816},
  pages = {3--18},
  month = oct,
  year = {2019},
  keywords = {analysis}
}

@article{yoon2009construction,
  author = {Su-Youn Yoon and Lisa Pierce and Amanda Huensch and Eric Juul and Samantha Perkins and Richard Sproat and Mark Hasegawa-Johnson},
  title = {Construction of a rated speech corpus of {L2} learners' speech},
  url = {https://www.jstor.org/stable/pdf/calicojournal.26.3.662.pdf},
  journal = {CALICO Journal},
  volume = {26},
  number = {3},
  year = {2009},
  keywords = {analysis}
}

@article{chang2007brain,
  author = {Soo-Eun Chang and Nicoline Ambrose and Kirk Erickson and Mark Hasegawa-Johnson},
  title = {Brain Anatomy Differences in Childhood Stuttering},
  doi = {10.1016/j.neuroimage.2007.09.067},
  journal = {NeuroImage},
  grant = {NIH DC05210},
  keywords = {analysis},
  year = {2007}
}

@inproceedings{chang2006deficient,
  author = {Soo-Eun Chang and Kirk I. Erickson and Nicoline G. Ambrose and Mark Hasegawa-Johnson and C. L. Ludlow},
  title = {Deficient white matter development in left hemisphere speech-language regions in children who stutter},
  booktitle = {Society for Neuroscience},
  address = {Atlanta, GA},
  year = {2006},
  grant = {NIH DC05210},
  keywords = {analysis}
}

@inproceedings{chang2004an,
  author = {Soo-Eun Chang and Nicoline Ambrose and Mark Hasegawa-Johnson},
  title = {An {MRI} ({DTI}) study on children with persistent developmental stuttering},
  booktitle = {ASHA Convention},
  month = nov,
  year = {2004},
  keywords = {analysis}
}

@inproceedings{scharenborg2019the,
  author = {Odette Scharenborg and Jiska Koemans and Cybelle Smith and Mark A. Hasegawa-Johnson and Kara D. Federmeier},
  title = {The Neural Correlates Underlying Lexically-Guided Perceptual Learning},
  booktitle = interspeech,
  year = {2019},
  pages = {1223--1227},
  keywords = {analysis},
  doi = {10.21437/Interspeech.2019-2328}
}

@inproceedings{pietrowicz2019dimensional,
  author = {Mary Pietrowicz and Carla Agurto and Jonah Casebeer and Mark Hasegawa-Johnson and Karrie Karahalios and Guillermo Cecchi},
  title = {Dimensional Analysis of Laughter in Female Conversational Speech},
  url = {https://ieeexplore.ieee.org/abstract/document/8683566},
  booktitle = icassp,
  year = {2019},
  pages = {6600--6604},
  doi = {10.1109/ICASSP.2019.8683566},
  keywords = {analysis}
}

@article{chen2016mismatched,
  author = {Wenda Chen and Mark Hasegawa-Johnson and Nancy F. Chen},
  title = {Mismatched Crowdsourcing based Language Perception for Under-resourced Languages},
  journal = {Procedia Computer Science},
  year = {2016},
  volume = {81},
  pages = {23--29},
  doi = {10.1016/j.procs.2016.04.025},
  keywords = {analysis}
}

@inproceedings{xie2016landmark,
  author = {Yanlu Xie and Mark Hasegawa-Johnson and Leyuan Qu and Jinsong Zhang},
  title = {Landmark of {Mandarin} Nasal Codas and its Application in Pronunciation Error Detection},
  doi = {10.1109/ICASSP.2016.7472703},
  booktitle = icassp,
  year = {2016},
  keywords = {analysis}
}

@article{kim2013automatic,
  author = {Kyungtae Kim and Kai-Hsiang Lin and Dirk B. Walther and Mark A. Hasegawa-Johnson and Thomas S. Huang},
  title = {Automatic Detection of Auditory Salience with Optimized Linear Filters Derived from Human Annotation},
  doi = {10.1016/j.patrec.2013.11.010},
  journal = {Pattern Recognition Letters},
  volume = {38},
  number = {1},
  year = {2013},
  pages = {78--85},
  grant = {NSF 0803219},
  keywords = {analysis}
}

@article{lobdell2010intelligibility,
  author = {Bryce E. Lobdell and Jont B. Allen and Mark A. Hasegawa-Johnson},
  title = {Intelligibility predictors and neural representation of speech},
  doi = {10.1016/j.specom.2010.08.016},
  journal = jsc,
  keywords = {analysis},
  year = {2010}
}

@phdthesis{lobdell2009models,
  author = {Bryce Lobdell},
  title = {Models of Human Phone Transcription in Noise Based on Intelligibility Predictors},
  school = {University of Illinois},
  year = {2009},
  url = {https://hdl.handle.net/2142/81127},
  keywords = {analysis}
}

@article{mo2009how,
  author = {Yoonsook Mo and Jennifer Cole and Mark Hasegawa-Johnson},
  title = {How do ordinary listeners perceive prosodic prominence? Syntagmatic vs. Paradigmatic comparison},
  doi = {10.1121/1.4783760},
  journal = jasa,
  year = {2009},
  volume = {125},
  number = {4},
  pages = {2572},
  grant = {NSF 0703624},
  keywords = {analysis}
}

@inproceedings{lobdell2008human,
  author = {Bryce Lobdell and Mark Hasegawa-Johnson and Jont B. Allen},
  title = {Human Speech Perception and Feature Extraction},
  booktitle = interspeech,
  pages = {1797--1800},
  year = {2008},
  doi = {10.21437/Interspeech.2008-494},
  keywords = {analysis}
}

@inproceedings{mo2008frequency,
  author = {Yoonsook Mo and Jennifer Cole and Mark Hasegawa-Johnson},
  title = {Frequency and repetition effects outweigh phonetic detail in prominence perception},
  url = {https://labphon.org/sites/default/files/previous_conferences/LabPhon11.pdf#page=51},
  booktitle = {LabPhon 11},
  pages = {29--30},
  year = {2008},
  keywords = {analysis}
}

@inproceedings{hasegawa-johnson2003bayesian,
  author = {Mark Hasegawa-Johnson},
  title = {{Bayesian} Learning for Models of Human Speech Perception},
  doi = {10.1109/SSP.2003.1289432},
  booktitle = {IEEE Workshop on Statistical Signal Processing},
  address = {St. Louis, MO},
  year = {2003},
  pages = {393--396},
  grant = {NSF 0132900},
  keywords = {analysis}
}

@article{takayanagi1997information,
  author = {Sumiko Takayanagi and Mark Hasegawa-Johnson and Laurie S. Eisner and Amy Schaefer-Martinez},
  title = {Information theory and variance estimation techniques in the analysis of category rating data and paired comparisons},
  journal = jasa,
  year = {1997},
  volume = {102},
  pages = {3091},
  keywords = {analysis}
}

@inproceedings{kong2017landmark-based,
  author = {Xiang Kong and Xuesong Yang and Jeung-Yoon Choi and Mark Hasegawa-Johnson and Stefanie Shattuck-Hufnagel},
  title = {Landmark-based consonant voicing detection on multilingual corpora},
  doi = {10.1121/1.4987203},
  url = {https://arxiv.org/pdf/1611.03533.pdf},
  booktitle = {Acoustics 17},
  address = {Boston},
  month = jun,
  year = {2017},
  keywords = {analysis}
}

@inproceedings{he2017selecting,
  author = {Di He and Boon Pang Lim and Xuesong Yang and Mark Hasegawa-Johnson and Deming Chen},
  title = {Selecting frames for automatic speech recognition based on acoustic landmarks},
  doi = {10.1121/1.4987204},
  url = {https://asa.scitation.org/doi/abs/10.1121/1.4987204},
  booktitle = {Acoustics 17},
  address = {Boston},
  month = jun,
  year = {2017},
  keywords = {analysis}
}

@phdthesis{abunasser2015computational,
  author = {Mahmoud Abunasser},
  title = {Computational Measures of Linguistic Variation: A Study of {Arabic} Varieties},
  url = {https://www.ideals.illinois.edu/items/79587},
  school = {University of Illinois},
  year = {2015},
  keywords = {analysis}
}

@inproceedings{benmamoun2013how,
  author = {Elabbas Benmamoun and Mark Hasegawa-Johnson},
  title = {How Different are {Arabic} Dialects from Each Other and from {Classical Arabic}},
  booktitle = {6th Annual Arabic Linguistics Symposium},
  isbn = {9789027236180},
  address = {Ifrane, Morocco},
  month = jun,
  year = {2013},
  keywords = {analysis}
}

@inproceedings{nam2011automatic,
  author = {Hosung Nam and Vikramjit Mitra and Mark Tiede and Mark Hasegawa-Johnson and Carol Espy-Wilson and Elliot Saltzman and Louis Goldstein},
  title = {Automatic gestural annotation of the {U. Wisconsin X-ray Microbeam} corpus},
  booktitle = {Workshop on New Tools and Methods for Very Large Scale Phonetics Research},
  publisher = {University of Pennsylvania},
  month = jan,
  year = {2011},
  keywords = {analysis}
}

@inproceedings{zhuang2008the,
  author = {Xiaodan Zhuang and Hosung Nam and Mark Hasegawa-Johnson and Louis Goldstein and Elliot Saltzman},
  title = {The Entropy of Articulatory Phonological Code: Recognizing Gestures from Tract Variables},
  booktitle = interspeech,
  year = {2008},
  pages = {1489--1492},
  doi = {10.21437/Interspeech.2008-428},
  grant = {NSF 0703624},
  keywords = {analysis}
}

@inproceedings{chitturi2006time,
  author = {Rahul Chitturi and Mark Hasegawa-Johnson},
  title = {Novel Time-Domain Multi-class {SVMs} for Landmark Detection},
  booktitle = interspeech,
  month = sep,
  year = {2006},
  pages = {paper 1904-Thu1CaP.14},
  doi = {10.21437/Interspeech.2006-105},
  keywords = {analysis}
}

@article{gao2022domain,
  author = {Gao, Heting and Ni, Junrui and Zhang, Yang and Qian, Kaizhi and Chang, Shiyu and Hasegawa-Johnson, Mark},
  title = {Domain Generalization for Language-Independent Automatic Speech Recognition},
  journal = {Frontiers in Artificial Intelligence},
  publisher = {Frontiers Media SA},
  year = {2022},
  volume = {5},
  pages = {806274},
  doi = {10.3389/frai.2022.806274}
}

@inproceedings{chitturi2006entropy,
  author = {Rahul Chitturi and Mark Hasegawa-Johnson},
  title = {Novel entropy based moving average refiners for {HMM} landmarks},
  year = {2006},
  booktitle = interspeech,
  pages = {paper 1911-Wed1FoP.8},
  doi = {10.21437/Interspeech.2006-468}
}

@inproceedings{hasegawajohnson00time,
  author = {Mark Hasegawa-Johnson},
  title = {Time-frequency distribution of partial phonetic information measured using mutual information},
  year = {2000},
  booktitle = {Proc. 6th International Conference on Spoken Language Processing (ICSLP 2000)},
  volume = {4},
  pages = {133--136},
  doi = {10.21437/ICSLP.2000-769},
  keywords = {analysis}
}

@article{hasegawajohnson1995burst,
  author = {Mark A. Hasegawa-Johnson},
  title = {Burst spectral measures and formant frequencies can be used to accurately discriminate stop place of articulation},
  journal = jasa,
  year = {1995},
  volume = {98},
  pages = {2890},
  doi = {10.1121/1.414301},
  url = {https://asa.scitation.org/doi/pdf/10.1121/1.414301},
  keywords = {analysis}
}

@article{johnson1994a,
  author = {Mark A. Johnson},
  title = {A mapping between trainable generalized properties and the acoustic correlates of distinctive features},
  journal = {MIT Speech Communication Group Working Papers},
  volume = {9},
  pages = {94--105},
  year = {1994},
  keywords = {analysis}
}

@inproceedings{johnson1994automatic,
  author = {Mark Johnson},
  title = {Automatic context-sensitive measurement of the acoustic correlates of distinctive features},
  doi = {10.21437/ICSLP.1994-424},
  booktitle = {ICSLP},
  address = {Yokohama},
  pages = {1639--1643},
  year = {1994},
  keywords = {analysis}
}

@article{johnson1993a,
  author = {Mark A. Johnson},
  title = {A mapping between trainable generalized properties and the acoustic correlates of distinctive features},
  journal = jasa,
  year = {1993},
  volume = {94},
  pages = {1865},
  doi = {10.1121/1.407629},
  url = {https://asa.scitation.org/doi/pdf/10.1121/1.407629},
  keywords = {analysis}
}

@unpublished{hasegawajohnson2018unwritten,
  author = {Mark Hasegawa-Johnson},
  title = {Unwritten Languages as a Test Case for the Theory of Phonetic Universals},
  year = {2018},
  note = {Plenary talk delivered at the International Symposium on Chinese Spoken Language Processing},
  keywords = {analysis}
}

@inproceedings{ozbek2009formant,
  author = {I. Y{\"u}cel {\"O}zbek and Mark Hasegawa-Johnson and M{\"u}beccel Demirekler},
  title = {Formant Trajectories for Acoustic-to-Articulatory Inversion},
  booktitle = interspeech,
  pages = {2807--2810},
  doi = {10.21437/Interspeech.2009-717},
  address = {Brighton},
  month = sep,
  year = {2009},
  keywords = {analysis}
}

@inproceedings{zheng2004stop,
  author = {Yanli Zheng and Mark Hasegawa-Johnson and Sarah Borys},
  title = {Stop Consonant Classification by Dynamic Formant Trajectory},
  booktitle = interspeech,
  pages = {396--399},
  month = oct,
  year = {2004},
  grant = {NSF 0132900},
  doi = {10.21437/Interspeech.2004-403},
  keywords = {analysis}
}

@inproceedings{zheng2004formant,
  author = {Yanli Zheng and Mark Hasegawa-Johnson},
  title = {Formant Tracking by Mixture State Particle Filter},
  doi = {10.1109/ICASSP.2004.1326048},
  booktitle = icassp,
  year = {2004},
  grant = {NSF 0132900},
  keywords = {analysis}
}

@inproceedings{zheng2003particle,
  author = {Yanli Zheng and Mark Hasegawa-Johnson},
  title = {Particle Filtering Approach to {Bayesian} Formant Tracking},
  doi = {10.1109/SSP.2003.1289549},
  booktitle = {IEEE Workshop on Statistical Signal Processing},
  month = sep,
  year = {2003},
  pages = {581--584},
  grant = {NSF 0132900},
  keywords = {analysis}
}

@phdthesis{johnson1996formant,
  author = {Mark A. Hasegawa-Johnson},
  title = {Formant and Burst Spectral Measurements with Quantitative Error Models for Speech Sound Classification},
  school = {MIT},
  year = {1996},
  url = {https://dspace.mit.edu/handle/1721.1/10636},
  keywords = {analysis}
}

@inproceedings{zhang2016analysis,
  author = {Yang Zhang and Gautham Mysore and Floraine Berthouzoz and Mark Hasegawa-Johnson},
  title = {Analysis of Prosody Increment Induced by Pitch Accents for Automatic Emphasis Correction},
  pages = {79--83},
  doi = {10.21437/SpeechProsody.2016-17},
  booktitle = {Speech Prosody},
  year = {2016},
  keywords = {analysis}
}

@unpublished{hasegawajohnson2016speech,
  author = {Mark Hasegawa-Johnson},
  title = {Speech Production, Speech Perception, and Phonology},
  note = {Lecture given at the Winter School on Speech and Audio Processing, Chennai, India},
  month = jan,
  year = {2016},
  keywords = {analysis}
}

@unpublished{hasegawajohnson2016prosody,
  author = {Mark Hasegawa-Johnson},
  title = {Prosody},
  note = {Lecture given at the Winter School on Speech and Audio Processing, Chennai, India},
  month = jan,
  year = {2016},
  keywords = {analysis}
}

@unpublished{hasegawajohnson2016multivariate,
  author = {Mark Hasegawa-Johnson},
  title = {Multivariate-State Models for Speech Recognition},
  note = {Lecture given at the Winter School on Speech and Audio Processing, Chennai, India},
  month = jan,
  year = {2016},
  keywords = {analysis}
}

@unpublished{hasegawajohnson2016limited,
  author = {Mark Hasegawa-Johnson},
  title = {Limited Data Settings},
  note = {Lecture given at the Winter School on Speech and Audio Processing, Chennai, India},
  month = jan,
  year = {2016},
  keywords = {analysis}
}

@inproceedings{jyothi2014an,
  author = {Preethi Jyothi and Jennifer Cole and Mark Hasegawa-Johnson and Vandana Puri},
  title = {An Investigation of Prosody in {Hindi} Narrative Speech},
  doi = {10.21437/SpeechProsody.2014-113},
  booktitle = {Speech Prosody},
  year = {2014},
  grant = {QNRF 09-410-1-069},
  keywords = {analysis}
}

@inproceedings{mahrt2012accounting,
  author = {Tim Mahrt and Jennifer Cole and Margaret Fleck and Mark Hasegawa-Johnson},
  title = {Accounting for Speaker Variation in the Production of Prominence using the {Bayesian} Information Criterion},
  url = {https://www.isca-speech.org/archive/speechprosody_2012/mahrt12_speechprosody.html},
  booktitle = {Speech Prosody},
  year = {2012},
  grant = {NSF 0703624},
  keywords = {analysis}
}

@inproceedings{mahrt2011optimal,
  author = {Tim Mahrt and Jui-Ting Huang and Yoonsook Mo and Margaret Fleck and Mark Hasegawa-Johnson and Jennifer Cole},
  title = {Optimal models of prosodic prominence using the {Bayesian} information criterion},
  booktitle = interspeech,
  pages = {2037--2040},
  doi = {10.21437/Interspeech.2011-535},
  year = {2011},
  keywords = {analysis}
}

@inproceedings{mahrt12_interspeech,
  author = {Tim Mahrt and Jennifer Cole and Margaret Fleck and Mark Hasegawa-Johnson},
  title = {{F0} and the perception of prominence},
  year = {2012},
  booktitle = interspeech,
  pages = {2422--2425},
  doi = {10.21437/Interspeech.2012-634}
}

@inproceedings{mo2010prosodic,
  author = {Yoonsook Mo and Jennifer Cole and Mark Hasegawa-Johnson},
  title = {Prosodic effects on temporal structure of monosyllabic {CVC} words in {American English}},
  booktitle = {Speech Prosody},
  url = {https://www.isca-speech.org/archive/speechprosody_2010/mo10_speechprosody.html},
  year = {2010},
  pages = {100208:1--4},
  grant = {NSF 0703624},
  keywords = {analysis}
}

@article{cole2007signal-based,
  author = {Jennifer Cole and Yoonsook Mo and Mark Hasegawa-Johnson},
  title = {Signal-based and expectation-based factors in the perception of prosodic prominence},
  journal = {Journal of Laboratory Phonology},
  year = {2010},
  doi = {10.1515/labphon.2010.022},
  grant = {NSF 0703624},
  keywords = {analysis}
}

@inproceedings{mo2009prosodic,
  author = {Yoonsook Mo and Jennifer Cole and Mark Hasegawa-Johnson},
  title = {Prosodic effects on vowel production: evidence from formant structure},
  booktitle = interspeech,
  pages = {2535--2538},
  address = {Brighton},
  month = {September},
  year = {2009},
  doi = {10.21437/Interspeech.2009-668},
  grant = {NSF 0703624},
  keywords = {analysis}
}

@inproceedings{yoon000168on,
  author = {Taejin Yoon and Jennifer Cole and Mark Hasegawa-Johnson},
  title = {On the edge: Acoustic cues to layered prosodic domains},
  booktitle = {Proc. International Congress on Phonetic Sciences (ICPhS)},
  pages = {1264:1017--1020},
  address = {Saarbrücken},
  month = {August},
  year = {2007},
  url = {http://www.icphs2007.de/conference/Papers/1264/1264.pdf},
  grant = {NSF 0414117},
  keywords = {analysis}
}

@inproceedings{hasegawajohnson12_speechprosody,
  author = {Mark Hasegawa-Johnson and Elabbas Benmamoun and Eiman Mustafawi and Mohamed Elmahdy and Rehab Duwairi},
  title = {On the definition of the word “segmental”},
  booktitle = {Proc. Speech Prosody 2012},
  pages = {159--162},
  year = {2012},
  url = {https://www.isca-speech.org/archive/speechprosody_2012/hasegawajohnson12_speechprosody.html}
}

@inproceedings{yoon2007on,
  author = {Taejin Yoon and Jennifer Cole and Mark Hasegawa-Johnson},
  title = {On the edge: Acoustic cues to layered prosodic domains},
  booktitle = {81st Annual Meeting of the Linguistic Society of America},
  address = {Anaheim, CA},
  month = {January},
  year = {2007},
  url = {http://www.icphs2007.de/conference/Papers/1264/1264.pdf},
  grant = {NSF 0414117},
  keywords = {analysis}
}

@article{cole2007prosodic,
  author = {Jennifer Cole and Heejin Kim and Hansook Choi and Mark Hasegawa-Johnson},
  title = {Prosodic effects on acoustic cues to stop voicing and place of articulation: Evidence from {Radio News} speech},
  journal = {Journal of Phonetics},
  volume = {35},
  pages = {180--209},
  year = {2007},
  doi = {10.1016/j.wocn.2006.03.004},
  grant = {NSF 0414117},
  keywords = {analysis}
}

@inproceedings{kim2006acoustic,
  author = {Heejin Kim and Taejin Yoon and Jennifer Cole and Mark Hasegawa-Johnson},
  title = {Acoustic differentiation of {L-} and {L-L\%} in {Switchboard} and {Radio News} speech},
  booktitle = {Proceedings of Speech Prosody},
  address = {Dresden},
  year = {2006},
  url = {https://www.isca-speech.org/archive/speechprosody_2006/kim06d_speechprosody.html},
  grant = {NSF 0414117},
  keywords = {analysis}
}

@unpublished{reddy2006thesis,
  author = {Rajiv Reddy},
  title = {Analysis of Pitch Contours in Repetition-Disfluency Using {Stem-ML}},
  note = {B.S. Thesis, University of Illinois},
  year = {2006},
  keywords = {analysis}
}

@unpublished{yoon2005mapping,
  author = {Taejin Yoon},
  title = {Mapping Syntax and Prosody},
  note = {Presentation at the Midwest Computational Linguistics Colloquium},
  address = {Columbus, OH},
  year = {2005},
  grant = {NSF 0414117},
  keywords = {analysis}
}

@article{choi2005finding,
  author = {Jeung-Yoon Choi and Mark Hasegawa-Johnson and Jennifer Cole},
  title = {Finding Intonational Boundaries Using Acoustic Cues Related to the Voice Source},
  journal = {Journal of the Acoustical Society of America},
  volume = {118},
  number = {4},
  pages = {2579--2588},
  year = {2005},
  doi = {10.1121/1.2010288},
  keywords = {analysis}
}

@inproceedings{cole2005prosodic,
  author = {Jennifer Cole and Mark Hasegawa-Johnson and Chilin Shih and Eun-Kyung Lee and Heejin Kim and H. Lu and Yoonsook Mo and Tae-Jin Yoon},
  title = {Prosodic Parallelism as a Cue to Repetition and Hesitation Disfluency},
  booktitle = {Disfluency In Spontaneous Speech (DISS'05)},
  address = {Aix-en-Provence, France},
  pages = {53--58},
  year = {2005},
  url = {https://www.isca-speech.org/archive/diss_2005/cole05_diss.html},
  grant = {NSF 0414117},
  keywords = {analysis}
}

@inproceedings{yoon2004intertranscriber,
  author = {Tae-Jin Yoon and Sandra Chavarria and Jennifer Cole and Mark Hasegawa-Johnson},
  title = {Intertranscriber Reliability of Prosodic Labeling on Telephone Conversation Using ToBI},
  booktitle = interspeech,
  pages = {2729--2732},
  month = {October},
  year = {2004},
  doi = {10.21437/Interspeech.2004-659},
  keywords = {analysis}
}

@inproceedings{yoon2004local,
  author = {Tae-Jin Yoon and Heejin Kim and Sandra Chavarría},
  title = {Local Acoustic Cues Distinguishing Two Levels of Prosodic Phrasing: Speech Corpus Evidence},
  booktitle = {Labphon 9},
  address = {University of Illinois at Urbana-Champaign},
  year = {2004},
  url = {https://www.researchgate.net/profile/Tae-Jin-Yoon/publication/238592404_Local_Acoustic_Cues_Distinguish_Two_Levels_of_Prosodic_Phrasing_Speech_Corpus_Evidence/links/5575664408ae753637500253/Local-Acoustic-Cues-Distinguish-Two-Levels-of-Prosodic-Phrasing-Speech-Corpus-Evidence.pdf},
  keywords = {analysis}
}

@inproceedings{kim2004the,
  author = {Heejin Kim and Jennifer Cole and Hansook Choi and Mark Hasegawa-Johnson},
  title = {The Effect of Accent on Acoustic Cues to Stop Voicing and Place of Articulation in {Radio News} Speech},
  booktitle = {Speech Prosody},
  address = {Nara, Japan},
  pages = {29--32},
  month = {March},
  year = {2004},
  url = {https://www.isca-speech.org/archive/speechprosody_2004/kim04_speechprosody.html},
  keywords = {analysis}
}

@inproceedings{chavarria000179acoustic,
  author = {Sandra Chavarria and Taejin Yoon and Jennifer Cole and Mark Hasegawa-Johnson},
  title = {Acoustic differentiation of ip and {IP} boundary levels: Comparison of {L-} and {L-L\%} in the {Switchboard} corpus},
  booktitle = {Speech Prosody},
  address = {Nara, Japan},
  pages = {333--336},
  month = {March},
  year = {2004},
  url = {https://www.isca-speech.org/archive/speechprosody_2004/chavarria04_speechprosody.html},
  keywords = {analysis}
}

@inproceedings{cole000180the,
  author = {Jennifer Cole and Hansook Choi and Heejin Kim and Mark Hasegawa-Johnson},
  title = {The effect of accent on the acoustic cues to stop voicing in {Radio News} speech},
  booktitle = {ICPhS},
  pages = {2665--2668},
  year = {2003},
  url = {https://www.internationalphoneticassociation.org/icphs-proceedings/ICPhS2003/papers/p15_2665.pdf},
  keywords = {analysis}
}

@article{johnson1992analysis,
  author = {Mark A. Johnson},
  title = {Analysis of durational rhythms in two poems by {Robert Frost}},
  journal = {MIT Speech Communication Group Working Papers},
  volume = {8},
  pages = {29--42},
  year = {1992},
  keywords = {analysis}
}

@unpublished{borys2008lovable,
  author = {Sarah Borys},
  title = {Lovable Indestructible Grad Student of Chaos},
  note = {Cartoons published online},
  year = {2008},
  keywords = {analysis}
}

@phdthesis{borys2009lovable,
  author = {Sarah Borys},
  title = {Lovable Indestructible Grad Student of Chaos},
  school = {University of Illinois},
  year = {2009},
  keywords = {analysis}
}

@article{ozbek2011on,
  author = {İ. Yücel Ozbek and Mark Hasegawa-Johnson and Mübeccel Demirekler},
  title = {On Improving Dynamic State Space Approaches to Articulatory Inversion with {MAP} based Parameter Estimation},
  journal = {IEEE Transactions on Audio, Speech, and Language Processing},
  volume = {20},
  number = {1},
  pages = {67--81},
  year = {2011},
  doi = {10.1109/TASL.2011.2157496},
  keywords = {analysis}
}

@article{ozbek2011estimation,
  author = {İ. Yücel Ozbek and Mark Hasegawa-Johnson and Mübeccel Demirekler},
  title = {Estimation of Articulatory Trajectories Based on {Gaussian} Mixture Model {(GMM)} with Audio-Visual Information Fusion and Dynamic {Kalman} Smoothing},
  journal = {IEEE Transactions on Audio, Speech, and Language Processing},
  volume = {19},
  number = {5},
  pages = {1180--1195},
  year = {2011},
  doi = {10.1109/TASL.2010.2087751},
  keywords = {analysis}
}

@inproceedings{hasegawajohnson000187mismatched,
  author = {Mark Hasegawa-Johnson and Preethi Jyothi and Wenda Chen and Van Hai Do},
  title = {Mismatched Crowdsourcing: Mining Latent Skills to Acquire Speech Transcriptions},
  booktitle = {Proceedings of Asilomar},
  year = {2017},
  doi = {10.1109/ACSSC.2017.8335558},
  grant = {DARPA LORELEI},
  keywords = {analysis}
}

@inproceedings{hai2016analysis,
  author = {Van Hai Do and Nancy F. Chen and Boon Pang Lim and Mark Hasegawa-Johnson},
  title = {Analysis of Mismatched Transcriptions Generated by Humans and Machines for Under-Resourced Languages},
  booktitle = interspeech,
  pages = {3863--3867},
  year = {2016},
  doi = {10.21437/Interspeech.2016-736},
  keywords = {analysis}
}

@article{kong2016performance,
  author = {Xiang Kong and Preethi Jyothi and Mark Hasegawa-Johnson},
  title = {Performance Improvement of Probabilistic Transcriptions with Language-specific Constraints},
  journal = {Procedia Computer Science},
  volume = {81},
  pages = {30--36},
  year = {2016},
  doi = {10.1016/j.procs.2016.04.026},
  url = {http://www.sciencedirect.com/science/article/pii/S1877050916300400},
  grant = {DARPA LORELEI},
  keywords = {analysis}
}

@inproceedings{varshney2016language,
  author = {Lav Varshney and Preethi Jyothi and Mark Hasegawa-Johnson},
  title = {Language Coverage for Mismatched Crowdsourcing},
  booktitle = {Workshop on Information Theory and Applications},
  year = {2016},
  doi = {10.1109/ITA.2016.7888198},
  grant = {NSF 1550145},
  keywords = {analysis}
}

@inproceedings{yeh2022equivariance,
  author = {Raymond Yeh and Mark Hasegawa-Johnson and Alexander Schwing},
  title = {Equivariance Discovery by Learned Parameter-Sharing},
  booktitle = {AISTATS},
  year = {2022},
  url = {https://proceedings.mlr.press/v151/yeh22b/yeh22b.pdf},
  keywords = {intelligence}
}

@inproceedings{shi2021continuous,
  author = {Hui Shi and Yang Zhang and Hao Wu and Shiyu Chang and Kaizhi Qian and Mark Hasegawa-Johnson and Jishen Zhao},
  title = {Continuous CNN for Nonuniform Time Series},
  booktitle = {Proc. ICASSP},
  year = {2021},
  doi = {10.1109/ICASSP39728.2021.9414318},
  keywords = {intelligence}
}

@inproceedings{chang2017dilated,
  author = {Shiyu Chang and Yang Zhang and Wei Han and Mo Yu and Xiaoxiao Guo and Wei Tan and Xiaodong Cui and Michael Witbrock and Mark Hasegawa-Johnson and Thomas Huang},
  title = {Dilated Recurrent Neural Networks},
  booktitle = {NIPS},
  year = {2017},
  url = {https://papers.nips.cc/paper/6613-dilated-recurrent-neural-networks.pdf},
  keywords = {intelligence}
}

@inproceedings{chang2017streaming,
  author = {Shiyu Chang and Yang Zhang and Jiliang Tang and Dawei Yin and Yi Chang and Mark Hasegawa-Johnson and Thomas Huang},
  title = {Streaming Recommender Systems},
  booktitle = {WWW 2017},
  pages = {381--389},
  year = {2017},
  doi = {10.1145/3038912.3052627},
  keywords = {intelligence}
}

@inproceedings{chang2016positive-unlabeled,
  author = {Shiyu Chang and Yang Zhang and Jiliang Tang and Dawei Yin and Yi Chang and Mark Hasegawa-Johnson and Thomas Huang},
  title = {Positive-Unlabeled Learning in Streaming Networks},
  booktitle = {KDD},
  pages = {755--764},
  year = {2016},
  url = {http://www.kdd.org/kdd2016/subtopic/view/positive-unlabeled-learning-in-streaming-networks},
  keywords = {intelligence}
}

@inproceedings{yeh2016stable,
  author = {Raymond Yeh and Mark Hasegawa-Johnson and Minh Do},
  title = {Stable and Symmetric Filter Convolutional Neural Network},
  booktitle = {Proc. ICASSP},
  pages = {2652--2656},
  year = {2016},
  doi = {10.1109/ICASSP.2016.7472158},
  keywords = {intelligence}
}

@article{omar2004model,
  author = {Mohammad Kamal Omar and Mark Hasegawa-Johnson},
  title = {Model Enforcement: A Unified Feature Transformation Framework for Classification and Recognition},
  journal = {IEEE Transactions on Signal Processing},
  volume = {52},
  number = {10},
  pages = {2701--2710},
  year = {2004},
  doi = {10.1109/TSP.2004.834344},
  grant = {NSF 0132900},
  keywords = {intelligence}
}

@inproceedings{yoon2022smsmix,
  author = {Hee Suk Yoon and Eunseop Yoon and John Harvill and Sunjae Yoon and Mark Hasegawa-Johnson and Chang D. Yoo},
  title = {{SMSMix}: Sense Maintained Sentence Mixup for Word Sense Disambiguation},
  booktitle = {EMNLP},
  pages = {1493--1502},
  month = {12},
  year = {2022},
  url = {https://aclanthology.org/2022.findings-emnlp.107.pdf},
  keywords = {intelligence}
}

@inproceedings{harvill2022syn2vec:,
  author = {John Harvill and Roxana Girju and Mark Hasegawa-Johnson},
  title = {{Syn2Vec}: Synset Colexification Graphs for Lexical Semantic Similarity},
  booktitle = {Proc. NAACL},
  pages = {5259--5270},
  year = {2022},
  doi = {10.18653/v1/2022.naacl-main.386},
  url = {https://aclanthology.org/2022.naacl-main.386/},
  keywords = {intelligence}
}

@inproceedings{ramnath2021worldly,
  author = {Kiran Ramnath and Leda Sarı and Mark Hasegawa-Johnson and Chang Yoo},
  title = {Worldly Wise {(WoW)} - Cross-Lingual Knowledge Fusion for Fact-based Visual Spoken-Question Answering},
  booktitle = {Proc. NAACL},
  pages = {1908--1919},
  year = {2021},
  doi = {10.18653/v1/2021.naacl-main.153},
  keywords = {intelligence}
}

@inproceedings{bharadwaj2014a,
  author = {Sujeeth Bharadwaj and Mark Hasegawa-Johnson},
  title = {A {PAC-Bayesian} Approach to Minimum Perplexity Language Modeling},
  booktitle = {Proceedings of CoLing},
  pages = {130--140},
  year = {2014},
  url = {https://aclanthology.org/C14-1014.pdf},
  grant = {NSF 0941268},
  keywords = {intelligence}
}

@inproceedings{wang2021interpretable,
  author = {Zhonghao Wang and Mo Yu and Kai Wang and Jinjun Xiong and Wen-mei Hwu and Mark Hasegawa-Johnson and Humphrey Shi},
  title = {Interpretable Visual Reasoning via Induced Symbolic Space},
  booktitle = {ICCV},
  pages = {1878--1887},
  year = {2021},
  url = {https://openaccess.thecvf.com/content/ICCV2021/html/Wang_Interpretable_Visual_Reasoning_via_Induced_Symbolic_Space_ICCV_2021_paper.html},
  keywords = {intelligence}
}

@inproceedings{yeh2018image,
  author = {Raymond A. Yeh and Teck Yian Lim and Chen Chen and Alexander G. Schwing and Mark Hasegawa-Johnson and Minh N. Do},
  title = {Image Restoration with Deep Generative Models},
  booktitle = {Proc. IEEE ICASSP},
  pages = {6772--6776},
  year = {2018},
  doi = {10.1109/ICASSP.2018.8462317},
  url = {https://ieeexplore.ieee.org/abstract/document/8462317},
  keywords = {intelligence}
}

@inproceedings{yeh2017semantic,
  author = {Raymond Yeh and Chen Chen and Teck Yian Lim and Alexander G. Schwing and Mark Hasegawa-Johnson and Minh N. Do},
  title = {Semantic Image Inpainting with Deep Generative Networks},
  booktitle = {CVPR},
  pages = {5485--5493},
  year = {2017},
  url = {https://openaccess.thecvf.com/content_cvpr_2017/html/Yeh_Semantic_Image_Inpainting_CVPR_2017_paper.html},
  keywords = {intelligence}
}

@inproceedings{lin2014foreground,
  author = {Kai-Hsiang Lin and Pooya Khorrami and Jiangping Wang and Mark Hasegawa-Johnson and Thomas S. Huang},
  title = {Foreground Object Detection in Highly Dynamic Scenes Using Saliency},
  booktitle = {Proceedings of ICIP},
  pages = {1125--1129},
  year = {2014},
  doi = {10.1109/ICIP.2014.7025224},
  keywords = {intelligence}
}

@inproceedings{wang2014active,
  author = {Zhaowen Wang and Zhangyang Wang and Mark Moll and Po-Sen Huang and Devin Grady and Nasser Nasrabadi and Thomas Huang and Lydia Kavraki and Mark Hasegawa-Johnson},
  title = {Active Planning, Sensing and Recognition Using a Resource-Constrained Discriminant {POMDP}},
  booktitle = {CVPR Multi-Sensor Fusion Workshop},
  pages = {740--747},
  year = {2014},
  url = {https://www.cv-foundation.org/openaccess/content_cvpr_workshops_2014/W19/html/Wang_Active_Planning_Sensing_2014_CVPR_paper.html},
  grant = {ARO W911NF-09-1-0383},
  keywords = {intelligence}
}

@article{zhou2010novel,
  author = {Xi Zhou and Xiaodan Zhuang and Hao Tang and Mark A. Hasegawa-Johnson and Thomas S. Huang},
  title = {Novel {Gaussianized} Vector Representation for Improved Natural Scene Categorization},
  journal = {Pattern Recognition Letters},
  volume = {31},
  number = {8},
  pages = {702--708},
  month = {Jun.},
  year = {2010},
  doi = {10.1016/j.patrec.2009.12.010},
  grant = {NSF 0807329},
  keywords = {intelligence}
}

@inproceedings{tang2010non-frontal,
  author = {Hao Tang and Mark Hasegawa-Johnson and Thomas S. Huang},
  title = {Non-Frontal View Facial Expression Recognition},
  booktitle = {ICME},
  pages = {1202--1207},
  year = {2010},
  doi = {10.1109/ICME.2010.5582576},
  keywords = {intelligence}
}

@inproceedings{zhuang2009efficient,
  author = {Xiaodan Zhuang and Xi Zhou and Mark A. Hasegawa-Johnson and Thomas S. Huang},
  title = {Efficient Object Localization with {Gaussianized} Vector Representation},
  booktitle = {IMCE},
  pages = {89--96},
  year = {2009},
  doi = {10.1145/1631040.1631055},
  grant = {NSF 0803219},
  keywords = {intelligence}
}

@inproceedings{zhuang2008face,
  author = {Xiaodan Zhuang and Xi Zhou and Mark Hasegawa-Johnson and Thomas Huang},
  title = {Face Age Estimation Using Patch-based Hidden {Markov} Model Supervectors},
  booktitle = {ICPR},
  pages = {1--4},
  year = {2008},
  doi = {10.1109/ICPR.2008.4761364},
  grant = {NSF 0534106},
  keywords = {intelligence}
}

@inproceedings{zhou2008a,
  author = {Xi Zhou and Xiaodan Zhuang and Hao Tang and Mark Hasegawa-Johnson and Thomas Huang},
  title = {A Novel {Gaussianized} Vector Representation for Natural Scene Categorization},
  booktitle = {ICPR},
  pages = {1--4},
  year = {2008},
  doi = {10.1109/ICPR.2008.4761665},
  grant = {NSF 0534106},
  keywords = {intelligence}
}

@inproceedings{zhou2008sift-bag,
  author = {Xi Zhou and Xiaodan Zhuang and Shuicheng Yan and Shih-Fu Chang and Mark Hasegawa-Johnson and Thomas S. Huang},
  title = {{SIFT-Bag} Kernel for Video Event Analysis},
  booktitle = {ACM Multimedia},
  pages = {229--238},
  year = {2008},
  doi = {10.1145/1459359.1459391},
  grant = {NSF 0534106},
  keywords = {intelligence}
}

@inproceedings{yan2008regression,
  author = {Shuicheng Yan and Xi Zhou and Ming Liu and Mark Hasegawa-Johnson and Thomas S. Huang},
  title = {Regression from Patch Kernel},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages = {1--8},
  year = {2008},
  doi = {10.1109/CVPR.2008.4587405},
  url = {http://ieeexplore.ieee.org/xpl/freeabs_all.jsp?arnumber=4587405},
  keywords = {intelligence}
}

@inproceedings{yoon2023mitigating,
  author = {Eunseop Yoon and Hee Suk Yoon and Dhananjaya Gowda and SooHwan Eom and Daehyeok Kim and John Harvill and Heting Gao and Mark Hasegawa-Johnson and Chanwoo Kim and Chang D. Yoo},
  title = {Mitigating the Exposure Bias in Sentence-Level Grapheme-to-Phoneme {(G2P)} Transduction},
  booktitle = interspeech,
  year = {2023},
  keywords = {recognition}
}

@article{li2022autosegmental,
  author = {Jialu Li and Mark Hasegawa-Johnson},
  title = {Autosegmental Neural Nets 2.0: An Extensive Study of Training Synchronous and Asynchronous Phones and Tones for Under-Resourced Tonal Languages},
  journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
  volume = {30},
  pages = {1918--1926},
  month = {5},
  year = {2022},
  doi = {10.1109/TASLP.2022.3178238},
  url = {https://ieeexplore.ieee.org/abstract/document/9783062},
  keywords = {recognition}
}

@article{gao2022seamless,
  author = {Heting Gao and Xiaoxuan Wang and Sunghun Kang and Rusty Mina and Dias Issa and John Harvill and Leda Sarı and Mark Hasegawa-Johnson and Chang D. Yoo},
  title = {Seamless Equal Accuracy Ratio for Inclusive {CTC} Speech Recognition},
  journal = jsc,
  volume = {136},
  pages = {76--83},
  year = {2022},
  doi = {10.1016/j.specom.2021.11.004},
  keywords = {recognition}
}

@article{sari2021counterfactually,
  author = {Leda Sarı and Mark Hasegawa-Johnson and Chang D. Yoo},
  title = {Counterfactually Fair Automatic Speech Recognition},
  journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
  volume = {29},
  pages = {3515--3525},
  year = {2021},
  doi = {10.1109/TASLP.2021.3126949},
  keywords = {recognition}
}

@inproceedings{gao2021zero-shot,
  author = {Heting Gao and Junrui Ni and Yang Zhang and Kaizhi Qian and Shiyu Chang and Mark Hasegawa-Johnson},
  title = {Zero-shot Cross-Lingual Phonetic Recognition with External Language Embedding},
  booktitle = {Proc. Interspeech},
  pages = {1304--1308},
  year = {2021},
  doi = {10.21437/Interspeech.2021-1843},
  keywords = {recognition}
}

@article{sari2022auxiliary,
  author = {Leda Sarı and Mark Hasegawa-Johnson and Samuel Thomas},
  title = {Auxiliary Networks for Joint Speaker Adaptation and Speaker Change Detection},
  journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
  volume = {29},
  pages = {324--333},
  year = {2021},
  doi = {10.1109/TASLP.2020.3040626},
  keywords = {recognition}
}

@article{hasegawajohnson2020grapheme-to-phoneme,
  author = {Mark Hasegawa-Johnson and Leanne Rolston and Camille Goudeseune and Gina-Anne Levow and Katrin Kirchhoff},
  title = {Grapheme-to-Phoneme Transduction for Cross-Language {ASR}},
  journal = {Lecture Notes in Computer Science},
  volume = {12379},
  pages = {3--19},
  year = {2020},
  doi = {10.1007/978-3-030-59430-5_1},
  keywords = {recognition}
}

@inproceedings{li2020autosegmental,
  author = {Jialu Li and Mark Hasegawa-Johnson},
  title = {Autosegmental Neural Nets: Should Phones and Tones be Synchronous or Asynchronous?},
  booktitle = {Proc. Interspeech},
  pages = {1027--1031},
  year = {2020},
  doi = {10.21437/Interspeech.2020-1834},
  url = {http://arxiv.org/abs/2007.14351},
  keywords = {recognition}
}

@inproceedings{zelasko2020that,
  author = {Piotr Żelasko and Laureano Moro-Velázquez and Mark Hasegawa-Johnson and Odette Scharenborg and Najim Dehak},
  title = {That Sounds Familiar: An Analysis of Phonetic Representations Transfer Across Languages},
  booktitle = {Proc. Interspeech 2020},
  pages = {3705--3709},
  year = {2020},
  doi = {10.21437/Interspeech.2020-2513},
  keywords = {recognition}
}

@inproceedings{sar19_interspeech,
  author = {Leda Sarı and Samuel Thomas and Mark A. Hasegawa-Johnson},
  title = {Learning Speaker Aware Offsets for Speaker Adaptation of Neural Networks},
  booktitle = {Proc. Interspeech 2019},
  pages = {769--773},
  year = {2019},
  doi = {10.21437/Interspeech.2019-1788}
}

@inproceedings{he2150when,
  author = {Di He and Xuesong Yang and Boon Pang Lim and Yi Liang and Mark Hasegawa-Johnson and Deming Chen},
  title = {When {CTC} Training Meets Acoustic Landmarks},
  booktitle = {ICASSP},
  pages = {5996--6000},
  year = {2019},
  doi = {10.1109/ICASSP.2019.8683607},
  keywords = {recognition}
}

@article{hai2018multitask,
  author = {Van Hai Do and Nancy F. Chen and Boon Pang Lim and Mark Hasegawa-Johnson},
  title = {Multitask Learning for Phone Recognition of Underresourced Languages Using Mismatched Transcription},
  journal = {IEEE/ACM Transactions on Audio, Speech and Language Processing (TASLP)},
  volume = {26},
  number = {3},
  pages = {501--514},
  month = {March},
  year = {2018},
  doi = {10.1109/TASLP.2017.2782360},
  url = {https://dl.acm.org/citation.cfm?id=3180760},
  keywords = {recognition}
}

@inproceedings{do17_interspeech,
  author = {Van Hai Do and Nancy F. Chen and Boon Pang Lim and Mark Hasegawa-Johnson},
  title = {Multi-Task Learning Using Mismatched Transcription for Under-Resourced Speech Recognition},
  booktitle = {Proc. Interspeech 2017},
  pages = {734--738},
  year = {2017},
  doi = {10.21437/Interspeech.2017-788}
}

@inproceedings{li2018a,
  author = {Jialu Li and Mark Hasegawa-Johnson},
  title = {A Comparable Phone Set for the TIMIT Dataset Discovered in Clustering of Listen, Attend and Spell},
  booktitle = {NeurIPS Workshop on Interpretability and Robustness in Audio, Speech, and Language},
  year = {2018},
  keywords = {recognition}
}

@inproceedings{scharenborg2018visualizing,
  author = {Odette Scharenborg and Sebastian Tiesmeyer and Mark Hasegawa-Johnson and Najim Dehak},
  title = {Visualizing Phoneme Category Adaptation in Deep Neural Networks},
  booktitle = {Proc. Interspeech},
  pages = {1482--1486},
  year = {2018},
  doi = {10.21437/Interspeech.2018-1707},
  keywords = {recognition}
}

@inproceedings{sari2018mlslp,
  author = {Leda Sarı and Mark Hasegawa-Johnson},
  title = {Speaker Adaptation with an Auxiliary Network},
  booktitle = {MLSLP (ISCA Workshop on Machine Learning for Speech and Language Processing)},
  year = {2018},
  keywords = {recognition}
}

@inproceedings{he2018improved,
  author = {Di He and Boon Pang Lim and Xuesong Yang and Mark Hasegawa-Johnson and Deming Chen},
  title = {Improved ASR for under-resourced languages through Multi-task Learning with Acoustic Landmarks},
  booktitle = {Proc. Interspeech},
  pages = {2618--2622},
  year = {2018},
  doi = {10.21437/Interspeech.2018-1124},
  keywords = {recognition}
}

@phdthesis{das2018speech,
  author = {Amit Das},
  title = {Speech Recognition with Probabilistic Transcriptions and End-to-End Systems Using Deep Learning},
  school = {University of Illinois},
  year = {2018},
  url = {https://www.ideals.illinois.edu/items/109828},
  keywords = {recognition}
}

@inproceedings{das2018improving,
  author = {Amit Das and Mark Hasegawa-Johnson},
  title = {Improving DNNs Trained With Non-Native Transcriptions Using Knowledge Distillation and Target Interpolation},
  booktitle = {Proc. Interspeech},
  pages = {2434--2438},
  year = {2018},
  doi = {10.21437/Interspeech.2018-1450},
  keywords = {recognition}
}

@inproceedings{ondel2018bayesian,
  author = {Lucas Ondel and Pierre Godard and Laurent Besacier and Elin Larsen and Mark Hasegawa-Johnson and Odette Scharenborg and Emmanuel Dupoux and Lukas Burget and François Yvon and Sanjeev Khudanpur},
  title = {Bayesian Models for Unit Discovery on a Very Low Resource Language},
  booktitle = {Proc. ICASSP},
  pages = {5939--5943},
  year = {2018},
  doi = {10.1109/ICASSP.2018.8461545},
  keywords = {recognition}
}

@inproceedings{chen2018recognizing,
  author = {Wenda Chen and Mark Hasegawa-Johnson and Nancy Chen},
  title = {Recognizing Zero-resourced Languages based on Mismatched Machine Transcriptions},
  booktitle = {Proc. ICASSP},
  pages = {5979--5983},
  year = {2018},
  doi = {10.1109/ICASSP.2018.8462481},
  url = {https://ieeexplore.ieee.org/abstract/document/8462481},
  keywords = {recognition}
}

@inproceedings{yang2018joint,
  author = {Xuesong Yang and Kartik Audhkhasi and Andrew Rosenberg and Samuel Thomas and Bhuvana Ramabhadran and Mark Hasegawa-Johnson},
  title = {Joint Modeling of Accents and Acoustics for Multi-Accent Speech Recognition},
  booktitle = {Proc. ICASSP},
  pages = {5989--5993},
  year = {2018},
  doi = {10.1109/ICASSP.2018.8462557},
  url = {https://ieeexplore.ieee.org/abstract/document/8462557},
  keywords = {recognition}
}

@inproceedings{scharenborg2017building,
  author = {Odette Scharenborg and Francesco Ciannella and Shruti Palaskar and Alan Black and Florian Metze and Lucas Ondel and Mark Hasegawa-Johnson},
  title = {Building an ASR System for a Low-Resource Language Through the Adaptation of a High-Resource Language ASR System: Preliminary Results},
  booktitle = {Proc. Internat. Conference on Natural Language, Signal and Speech Processing (ICNLSSP)},
  address = {Casablanca, Morocco},
  year = {2017},
  url = {https://www.researchgate.net/profile/Kamel-Smaili-2/publication/354824671_Proceedings_of_the_International_Conference_on_Natural_Language_Processing_Signal_and_Speech_Processing/links/63503ccc12cbac6a3eda8cac/Proceedings-of-the-International-Conference-on-Natural-Language-Processing-Signal-and-Speech-Processing.pdf#page=28},
  keywords = {recognition}
}

@inproceedings{chen2017mismatched,
  author = {Wenda Chen and Mark Hasegawa-Johnson and Nancy F. Chen and Boon Pang Lim},
  title = {Mismatched Crowdsourcing from Multiple Annotator Languages For Recognizing Zero-resourced Languages: A Nullspace Clustering Approach},
  booktitle = {Proc. Interspeech},
  pages = {2789--2793},
  year = {2017},
  doi = {10.21437/Interspeech.2017-1567},
  keywords = {recognition}
}

@inproceedings{papadopoulos2017team,
  author = {Pavlos Papadopoulos and Ruchir Travadi and Colin Vaz and Nikolaos Malandrakis and Ulf Hermjakob and Nima Pourdamghani and Michael Pust and Boliang Zhang and Xiaoman Pan and Di Lu and Ying Lin and Ondrej Glembek and Murali Karthick B and Martin Karafiat and Lukas Burget and Mark Hasegawa-Johnson and Heng Ji and Jonathan May and Kevin Knight and Shrikanth Narayanan},
  title = {Team {ELISA} System for {DARPA LORELEI} Speech Evaluation 2016},
  booktitle = {Proc. Interspeech},
  pages = {2053--2057},
  year = {2017},
  doi = {10.21437/Interspeech.2017-180},
  keywords = {recognition}
}

@inproceedings{das2017deep,
  author = {Amit Das and Mark Hasegawa-Johnson and Karel Vesely},
  title = {Deep Autoencoder Based Multi-task Learning Using Probabilistic Transcription},
  booktitle = {Proc. Interspeech},
  pages = {2073--2077},
  year = {2017},
  doi = {10.21437/Interspeech.2017-582},
  keywords = {recognition}
}

@phdthesis{zhang2017generative,
  author = {Yang Zhang},
  title = {Application of Generative Models in Speech Processing Tasks},
  school = {University of Illinois},
  year = {2017},
  url = {https://www.ideals.illinois.edu/items/103415},
  keywords = {recognition}
}

@inproceedings{jyothi2017low-resource,
  author = {Preethi Jyothi and Mark Hasegawa-Johnson},
  title = {Low-Resource Grapheme-to-Phoneme Conversion using Recurrent Neural Networks},
  booktitle = {Proc. ICASSP},
  pages = {5030--5034},
  year = {2017},
  doi = {10.1109/ICASSP.2017.7953114},
  keywords = {recognition}
}

@inproceedings{hai2016speech,
  author = {Van Hai Do and Nancy F. Chen and Boon Pang Lim and Mark Hasegawa-Johnson},
  title = {Speech recognition of under-resourced languages using mismatched transcriptions},
  booktitle = {International Conference on Asian Language Processing IALP},
  address = {Tainan, Taiwan},
  month = {11},
  year = {2016},
  doi = {10.1109/IALP.2016.7875947},
  keywords = {recognition}
}

@inproceedings{hai2016a,
  author = {Van Hai Do and Nancy F. Chen and Boon Pang Lim and Mark Hasegawa-Johnson},
  title = {A many-to-one phone mapping approach for cross-lingual speech recognition},
  booktitle = {12th IEEE-RIVF International Conference on Computing and Communication Technologies},
  address = {Hanoi, Vietnam},
  pages = {120--124},
  month = {11},
  year = {2016},
  doi = {10.1109/RIVF.2016.7800280},
  keywords = {recognition}
}

@inproceedings{das2016an,
  author = {Amit Das and Mark Hasegawa-Johnson},
  title = {An investigation on training deep neural networks using probabilistic transcription},
  booktitle = interspeech,
  pages = {3858--3862},
  year = {2016},
  doi = {10.21437/Interspeech.2016-655},
  software = {https://github.com/irrawaddy28/interspeech16-mtl},
  keywords = {recognition}
}

@inproceedings{jyothi14_speechprosody,
  author = {Preethi Jyothi and Jennifer Cole and Mark Hasegawa-Johnson and Vandana Puri},
  title = {An Investigation of Prosody in {Hindi} Narrative Speech},
  booktitle = {Proc. Speech Prosody 2014},
  pages = {623--627},
  year = {2014},
  doi = {10.21437/SpeechProsody.2014-113}
}

@inproceedings{das2016automatic,
  author = {Amit Das and Preethi Jyothi and Mark Hasegawa-Johnson},
  title = {Automatic speech recognition using probabilistic transcriptions in {Swahili}, {Amharic} and {Dinka}},
  booktitle = interspeech,
  pages = {3524--3528},
  year = {2016},
  doi = {10.21437/Interspeech.2016-657},
  software = {https://github.com/irrawaddy28/africanpaper},
  keywords = {recognition}
}

@inproceedings{liu2016adapting,
  author = {Chunxi Liu and Preethi Jyothi and Hao Tang and Vimal Manohar and Rose Sloan and Tyler Kekona and Mark Hasegawa-Johnson and Sanjeev Khudanpur},
  title = {Adapting {ASR} for Under-Resourced Languages Using Mismatched Transcriptions},
  booktitle = {Proc. ICASSP},
  pages = {5840--5844},
  year = {2016},
  doi = {10.1109/ICASSP.2016.7472797},
  keywords = {recognition}
}

@inproceedings{das2015cross-lingual,
  author = {Amit Das and Mark Hasegawa-Johnson},
  title = {Cross-lingual transfer learning during supervised training in low resource scenarios},
  booktitle = interspeech,
  pages = {3531--3535},
  year = {2015},
  doi = {10.21437/Interspeech.2015-700},
  keywords = {recognition}
}

@inproceedings{chen2014an,
  author = {Xiayu Chen and Yang Zhang and Mark Hasegawa-Johnson},
  title = {An iterative approach to decision tree training for context dependent speech synthesis},
  booktitle = interspeech,
  pages = {2327--2331},
  year = {2014},
  doi = {10.21437/Interspeech.2014-191},
  keywords = {recognition}
}

@inproceedings{khasanova14_interspeech,
  author = {Alina Khasanova and Jennifer Cole and Mark Hasegawa-Johnson},
  title = {Detecting articulatory compensation in acoustic data through linear regression modeling},
  booktitle = {Proc. Interspeech 2014},
  pages = {925--929},
  year = {2014},
  doi = {10.21437/Interspeech.2014-241}
}

@inproceedings{elmahdy2014automatic,
  author = {Mohamed Elmahdy and Mark Hasegawa-Johnson and Eiman Mustafawi},
  title = {Automatic Long Audio Alignment and Confidence Scoring for Conversational Arabic Speech},
  booktitle = {The 9th edition of the Language Resources and Evaluation Conference (LREC 2014)},
  address = {Reykjavik, Iceland},
  year = {2014},
  isbn = {9782951740884},
  url = {http://www.lrec-conf.org/proceedings/lrec2014/pdf/434_Paper.pdf},
  grant = {QNRF NPRP 09-410-1-069},
  keywords = {recognition}
}

@inproceedings{elmahdy000038development,
 author={Mohamed Elmahdy and Mark Hasegawa-Johnson and Eiman Mustafawi},
 title={Development of a {TV} Broadcasts Speech Recognition System for {Qatari Arabic}},
 url={http://www.lrec-conf.org/proceedings/lrec2014/pdf/430_Paper.pdf},
 booktitle={The 9th edition of the Language Resources and Evaluation Conference (LREC 2014)},
 year={2014},
 pages={3057--3061},
 isbn={9782951740884},
 address={Reykjavik, Iceland},
 grant={QNRF NPRP 09-410-1-069},
 keywords={recognition}
}

@unpublished{yeh2014divergence,
 author={Raymond Yeh},
 title={Divergence Guided Two Beams {Viterbi} Algorithm on Factorial {HMMs}},
 note={B.S. Thesis, University of Illinois},
 url={https://www.ideals.illinois.edu/items/55775},
 year={2014},
 keywords={recognition}
}

@inproceedings{elmahdy2013transfer,
 author={Mohamed Elmahdy and Mark Hasegawa-Johnson and Eiman Mustafawi},
 title={A Transfer Learning Approach for Under-Resourced {Arabic} Dialects Speech Recognition},
 url={https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=a7e6a76e0c1f39171c2603657a94c8ba4418a788},
 booktitle={Workshop on Less Resourced Languages, new technologies, new challenges and opportunities (LTC 2013)},
 pages={60--64},
 year={2013},
 grant={QNRF NPRP 09-410-1-069},
 keywords={recognition}
}

@inproceedings{elmahdy2013automatic,
 author={Mohamed Elmahdy and Mark Hasegawa-Johnson and Eiman Mustafawi},
 title={Automatic Long Audio Alignment for Conversational {Arabic} Speech},
 booktitle={Qatar Foundation Annual Research Conference},
 year={2013},
 doi={10.5339/qfarf.2013.ICTP-03},
 keywords={recognition}
}

@inproceedings{elmahdy2013development,
 author={Mohamed Elmahdy and Mark Hasegawa-Johnson and Eiman Mustafawi},
 title={Development of a Spontaneous Large Vocabulary Speech Recognition System for {Qatari Arabic}},
 booktitle={Qatar Foundation Annual Research Conference},
 year={2013},
 doi={10.5339/qfarf.2013.ICTP-053},
 keywords={recognition}
}

@inproceedings{elmahdy2013framework,
 author={Mohamed Elmahdy and Mark Hasegawa-Johnson and Eiman Mustafawi},
 title={A Framework for Conversational {Arabic} Speech Long Audio Alignment},
 url={https://www.academia.edu/download/33424750/ltc-066-mohamed.pdf},
 booktitle={Proc. 6th Language and Technology Conference (LTC 2013)},
 year={2013},
 pages={290--293},
 grant={QNRF NPRP 09-410-1-069},
 keywords={recognition}
}

@inproceedings{bharadwaj2013sparse,
 author={Sujeeth Bharadwaj and Mark Hasegawa-Johnson and Jitendra Ajmera and Om Deshmukh and Ashish Verma},
 title={Sparse Hidden {Markov} Models for Purer Clusters},
 doi={10.1109/ICASSP.2013.6638228},
 booktitle=icassp,
 year={2013},
 keywords={recognition}
}

@inproceedings{elmahdy2012a,
 author={Mohamed Elmahdy and Mark Hasegawa-Johnson and Eiman Mustafawi},
 title={A Baseline Speech Recognition System for {Levantine} Colloquial {Arabic}},
 url={https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=0dae1d58dddf914a9aed367e4a8045213e4202d5},
 booktitle={Proceedings of ESOLEC},
 year={2012},
 grant={QNRF NPRP 09-410-1-069},
 keywords={recognition}
}

@inproceedings{huang2012cross-dialectal,
 author={Po-Sen Huang and Mark Hasegawa-Johnson},
 title={Cross-Dialectal Data Transferring for {Gaussian} Mixture Model Training in {Arabic} Speech Recognition},
 url={https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=5d995e455f1f08c0032b71fd7f0bcd1dcde5786b},
 booktitle={International Conference on Arabic Language Processing CITALA},
 year={2012},
 pages={119--122},
 isbn={978-9954-9135-0-5},
 grant={QNRF NPRP 09-410-1-069},
 keywords={recognition}
}

@inproceedings{elmahdy2011challenges,
 author={Mohamed Elmahdy and Mark Hasegawa-Johnson and Eiman Mustafawi and Rehab Duwairi and Wolfgang Minker},
 title={Challenges and Techniques for Dialectal {Arabic} Speech Recognition and Machine Translation},
 doi={10.5339/qfarf.2011.CSO5},
 booktitle={Qatar Foundation Annual Research Forum},
 year={2011},
 pages={244},
 grant={QNRF NPRP 09-410-1-069},
 keywords={recognition}
}

@phdthesis{huang2012semi-supervised,
  author   = {Jui-Ting Huang},
  title    = {Semi-Supervised Learning for Acoustic and Prosodic Modeling in Speech Applications},
  school   = {University of Illinois},
  year     = {2012},
  url      = {https://www.ideals.illinois.edu/items/32271},
  keywords = {recognition}
}

@unpublished{hasegawajohnson2011learning,
 author={Mark Hasegawa-Johnson and Jui-Ting Huang and Roxana Girju and Rehab Mustafa Mohamma Duwairi and Eiman Mohd Tayyeb H B Mustafawi and Elabbas Benmamoun},
 title={Learning to Recognize Speech from a Small Number of Labeled Examples},
 doi={10.5339/qfarf.2011.CSP15},
 note={Qatar Foundation Annual Research Forum},
 year={2011},
 pages={269},
 grant={QNRF NPRP 09-410-1-069},
 keywords={recognition}
}

@article{hasegawajohnson2011normalized,
  author   = {Mark Hasegawa-Johnson and Jui-Ting Huang and Sarah King and Xi Zhou},
  title    = {Normalized recognition of speech and audio events},
  journal  = {Journal of the Acoustical Society of America},
  volume   = {130},
  pages    = {2524},
  year     = {2011},
  doi      = {10.1121/1.3655075},
  grant    = {NSF 0807329},
  keywords = {recognition}
}

@article{hasegawajohnson2011semi-supervised,
  author   = {Mark Hasegawa-Johnson and Jui-Ting Huang and Xiaodan Zhuang},
  title    = {Semi-supervised learning for speech and audio processing},
  journal  = {Journal of the Acoustical Society of America},
  volume   = {130},
  pages    = {2408},
  year     = {2011},
  doi      = {10.1121/1.3654654},
  grant    = {NSF 0703624},
  keywords = {recognition}
}

@phdthesis{pang2011computational,
  author   = {Boon Pang Lim},
  title    = {Computational Differences between Whispered and Non-whispered Speech},
  school   = {University of Illinois},
  year     = {2011},
  url      = {https://www.ideals.illinois.edu/items/24896},
  keywords = {recognition}
}

@inproceedings{huang2011how,
  author    = {Jui-Ting Huang and Mark Hasegawa-Johnson and Jennifer Cole},
  title     = {How Unlabeled Data Change the Acoustic Models For Phonetic Classification},
  booktitle = {Workshop on New Tools and Methods for Very Large Scale Phonetics Research},
  address   = {University of Pennsylvania},
  month     = {Jan.},
  year      = {2011},
  url       = {https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=a6231219eed53704d7afb38176db1aa04705a1f6},
  keywords  = {recognition}
}

@inproceedings{huang2010prosody-dependent,
 author={Jui-Ting Huang and Po-Sen Huang and Yoonsook Mo and Mark Hasegawa-Johnson and Jennifer Cole},
 title={Prosody-Dependent Acoustic Modeling Using Variable-Parameter Hidden {Markov} Models},
 url={https://www.isca-speech.org/archive/speechprosody_2010/huang10_speechprosody.html},
 booktitle={Speech Prosody},
 year={2010},
 pages={100623:1--4},
 grant={NSF 0703624},
 keywords={recognition}
}

@inproceedings{tang2010toward,
 author={Hao Tang and Mark Hasegawa-Johnson and Thomas S. Huang},
 title={Toward Robust Learning of the {Gaussian} Mixture State Emission Densities for Hidden {Markov} Models},
 doi={10.1109/ICASSP.2010.5494989},
 booktitle=icassp,
 year={2010},
 grant={NSF 0803219},
 keywords={recognition}
}

@inproceedings{huang2009kernel,
 author={Jui-Ting Huang and Xi Zhou and Mark Hasegawa-Johnson and Thomas Huang},
 title={Kernel Metric Learning for Phonetic Classification},
 doi={10.1109/ASRU.2009.5373389},
 booktitle={ASRU},
 year={2009},
 pages={141--145},
 grant={NSF 0703624},
 keywords={recognition}
}

@inproceedings{zhuang2009articulatory,
  author    = {Xiaodan Zhuang and Hosung Nam and Mark Hasegawa-Johnson and Louis Goldstein and Elliot Saltzman},
  title     = {Articulatory Phonological Code for Word Recognition},
  booktitle = interspeech,
  address   = {Brighton},
  month     = {September},
  year      = {2009},
  pages     = {2763--2766},
  doi       = {10.21437/Interspeech.2009-706},
  grant     = {NSF 0703624},
  keywords  = {recognition}
}

@inproceedings{lee2009a,
  author    = {Bowon Lee and Mark Hasegawa-Johnson},
  title     = {A Phonemic Restoration Approach for Automatic Speech Recognition with Highly Nonstationary Background Noise},
  booktitle = {DSP in Cars workshop},
  address   = {Dallas},
  month     = {July},
  year      = {2009},
  url       = {https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=66f31946db0456df7be1f6b09528e2f5be8f84e0},
  keywords  = {recognition}
}

@inproceedings{huang2009on,
 author={Jui-Ting Huang and Mark Hasegawa-Johnson},
 title={On semi-supervised learning of {Gaussian} mixture models for phonetic classification},
 url={https://aclanthology.org/W09-2210.pdf},
 booktitle={NAACL HLT Workshop on Semi-Supervised Learning},
 year={2009},
 pages={75--83},
 grant={NSF 0534106},
 keywords={recognition}
}

@inproceedings{huang2008maximum,
 author={Jui-Ting Huang and Mark Hasegawa-Johnson},
 title={Maximum Mutual Information Estimation with Unlabeled Data for Phonetic Classification},
 url={https://www.isca-archive.org/interspeech_2008/huang08_interspeech.pdf},
 booktitle=interspeech,
 year={2008},
 grant={NSF 0534133},
 keywords={recognition}
}

@inproceedings{zhuang000061the,
  author    = {Xiaodan Zhuang and Hosung Nam and Mark Hasegawa-Johnson and Louis Goldstein and Elliot Saltzman},
  title     = {The Entropy of Articulatory Phonological Code: Recognizing Gestures from Tract Variables},
  booktitle = interspeech,
  pages     = {1489--1492},
  year      = {2008},
  doi       = {10.21437/Interspeech.2008-428},
  grant     = {NSF 0703624},
  keywords  = {recognition}
}

@inproceedings{kantor2008stream,
 author={Arthur Kantor and Mark Hasegawa-Johnson},
 title={Stream Weight Tuning in Dynamic {Bayesian} Networks},
 doi={10.1109/ICASSP.2008.4518662},
 booktitle=icassp,
 pages={4525--4528},
 year={2008},
 grant={NSF 0703624},
 keywords={recognition}
}

@phdthesis{lee2006robust,
  author   = {Bowon Lee},
  title    = {Robust Speech Recognition in a Car Using a Microphone Array},
  school   = {University of Illinois},
  year     = {2006},
  url      = {https://www.ideals.illinois.edu/items/82279},
  keywords = {recognition}
}

@inproceedings{hasegawajohnson2004landmark,
 author={Mark Hasegawa-Johnson and James Baker and Sarah Borys and Ken Chen and Emily Coogan and Steven Greenberg and Amit Juneja and Katrin Kirchhoff and Karen Livescu and Srividya Mohan and Jennifer Muller and Kemal Sönmez and Tianyu Wang},
 title={Landmark-Based Speech Recognition: Report of the 2004 {Johns Hopkins} Summer Workshop},
 doi={10.1109/ICASSP.2005.1415088},
 booktitle=icassp,
 month={March},
 year={2005},
 pages={1213--1216},
 grant={NSF 0121285},
 keywords={recognition}
}

@inproceedings{omar2003non-linear,
 author={Mohamed Kamal Omar and Mark Hasegawa-Johnson},
 title={Non-linear maximum likelihood feature transformation for speech recognition},
 year={2003},
 booktitle={Proc. 8th European Conference on Speech Communication and Technology (Eurospeech 2003)},
 pages={2497--2500},
 doi={10.21437/Eurospeech.2003-685}
}

@inproceedings{kim2005phonetic,
 author={Yeojin Kim and Mark Hasegawa-Johnson},
 title={Phonetic Segment Rescoring Using {SVMs}},
 booktitle={Midwest Computational Linguistics Colloquium},
 address={Columbus, OH},
 year={2005},
 grant={NSF 0132900},
 keywords={recognition}
}

@unpublished{hasegawajohnson2005landmark-based,
 author={Mark Hasegawa-Johnson and James Baker and Steven Greenberg and Katrin Kirchhoff and Jennifer Muller and Kemal Sonmez and Sarah Borys and Ken Chen and Amit Juneja and Karen Livescu and Srividya Mohan and Emily Coogan and Tianyu Wang},
 title={Landmark-Based Speech Recognition: Report of the 2004 {Johns Hopkins} Summer Workshop},
 note={Final report of the WS04 Johns Hopkins Summer Workshop team},
 number={WS04},
 year={2005},
 keywords={recognition}
}

@unpublished{hasegawajohnson2004landmark-based,
 author={Mark Hasegawa-Johnson},
 title={Landmark-Based Speech Recognition: The Marriage of High-Dimensional Machine Learning Techniques with Modern Linguistic Representations},
 note={talk given at Tsinghua University},
 month={October},
 year={2004},
 grant={NSF 0132900},
 keywords={recognition}
}

@inproceedings{hasegawajohnson2004factorial,
 author={Mark Hasegawa-Johnson and Ameya Deoras},
 title={A Factorial {HMM} Approach to Robust Isolated Digit Recognition in Background Music},
 booktitle=interspeech,
 month={October},
 year={2004},
 grant={NSF 0132900},
 pages={2093--2096},
 doi={10.21437/Interspeech.2004-637},
 keywords={recognition}
}

@inproceedings{deoras2004icassp,
 author={Ameya Deoras and Mark Hasegawa-Johnson},
 title={A Factorial {HMM} Approach to Simultaneous Recognition of Isolated Digits Spoken by Multiple Talkers on One Audio Channel},
 doi={10.1109/ICASSP.2004.1326122},
 booktitle=icassp,
 year={2004},
 grant={NSF 0132900},
 keywords={recognition}
}

@inproceedings{zheng2003acoustic,
 author={Yanli Zheng and Mark Hasegawa-Johnson},
 title={Acoustic segmentation using switching state {Kalman} Filter},
 doi={10.1109/ICASSP.2003.1198890},
 booktitle=icassp,
 year={2003},
 month={April},
 pages={I:752--755},
 grant={NSF 0132900},
 keywords={recognition}
}

@unpublished{deoras2003a,
 author={Ameya Deoras},
 title={A Factorial {HMM} Approach to Robust Isolated Digit Recognition in Non-Stationary Noise},
 note={B.S. Thesis, University of Illinois},
 year={2003},
 keywords={recognition}
}

@inproceedings{omar2001gaussian,
 author={Mohammed K. Omar and Mark Hasegawa-Johnson and Stephen E. Levinson},
 title={{Gaussian} Mixture Models of Phonetic Boundaries for Speech Recognition},
 doi={10.1109/ASRU.2001.1034582},
 booktitle={ASRU},
 year={2001},
 grant={NSF 0132900},
 keywords={recognition}
}

@inproceedings{hasegawajohnson2000multivariate-state,
 author={Mark Hasegawa-Johnson},
 title={Multivariate-State Hidden {Markov} Models for Simultaneous Transcription of Phones and Formants},
 doi={10.1109/ICASSP.2000.861822},
 booktitle=icassp,
 address={Istanbul},
 pages={1323--1326},
 year={2000},
 keywords={recognition}
}

@inproceedings{morshed22_interspeech,
 author={Mahir Morshed and Mark Hasegawa-Johnson},
 title={Cross-lingual articulatory feature information transfer for speech recognition using recurrent progressive neural networks},
 year={2022},
 booktitle=interspeech,
 pages={2298--2302},
 doi={10.21437/Interspeech.2022-11202}
}

@article{he2018acoustic,
 author={Di He and Boon Pang Lim and Xuesong Yang and Mark Hasegawa-Johnson and Deming Chen},
 title={Acoustic landmarks contain more information about the phone string than other frames for automatic speech recognition with deep neural network acoustic model},
 url={https://asa.scitation.org/doi/full/10.1121/1.5039837},
 journal={Journal of the Acoustical Society of America},
 year={2018},
 volume={143},
 number={6},
 pages={3207--3219},
 doi={10.1121/1.5039837},
 keywords={recognition}
}

@inproceedings{kong2017landmark,
  author    = {Xiang Kong and Xuesong Yang and Jeung-Yoon Choi and Mark Hasegawa-Johnson and Stefanie Shattuck-Hufnagel},
  title     = {Landmark-based consonant voicing detection on multilingual corpora},
  booktitle = {Acoustics 17},
  address   = {Boston},
  month     = {June},
  year      = {2017},
  doi       = {10.1121/1.4987203},
  keywords  = {recognition}
}

@inproceedings{qian2016application,
 author={Kaizhi Qian and Yang Zhang and Mark Hasegawa-Johnson},
 title={Application of Local Binary Patterns for {SVM} based Stop Consonant Detection},
 pages={1114--1118},
 doi={10.21437/SpeechProsody.2016-229},
 booktitle={Speech Prosody},
 year={2016},
 keywords={recognition}
}

@inproceedings{king2013accurate,
 author={Sarah King and Mark Hasegawa-Johnson},
 title={Accurate Speech Segmentation by Mimicking Human Auditory Processing},
 doi={10.1109/ICASSP.2013.6639242},
 booktitle=icassp,
 year={2013},
 grant={NSF 0807329},
 keywords={recognition}
}

@inproceedings{huang2013random,
 author={Po-Sen Huang and Li Deng and Mark Hasegawa-Johnson and Xiaodong He},
 title={Random Features for Kernel Deep Convex Network},
 doi={10.1109/ICASSP.2013.6638237},
 booktitle=icassp,
 year={2013},
 pages={3143--3147},
 keywords={recognition}
}

@inproceedings{king2012detection,
  author    = {Sarah King and Mark Hasegawa-Johnson},
  title     = {Detection of Acoustic-Phonetic Landmarks in Mismatched Conditions Using a Biomimetic Model of Human Auditory Processing},
  booktitle = {CoLing},
  pages     = {589--598},
  year      = {2012},
  url       = {https://aclanthology.org/C12-2058.pdf},
  grant     = {QNRF NPRP 09-410-1-069},
  keywords  = {recognition}
}

@inproceedings{hasegawajohnson2012on,
 author={Mark Hasegawa-Johnson and Elabbas Benmamoun and Eiman Mustafawi and Mohamed Elmahdy and Rehab Duwairi},
 title={On The Definition of the Word `Segmental'},
 url={https://www.isca-speech.org/archive/speechprosody_2012/hasegawajohnson12_speechprosody.html},
 booktitle={Speech Prosody},
 year={2012},
 pages={159--162},
 isbn={978-7-5608-486-3},
 keywords={recognition}
}

@inproceedings{liu2007frequency,
 author={Ming Liu and Xi Zhou and Mark Hasegawa-Johnson and Thomas S. Huang and Zhengyou Zhang},
 title={Frequency Domain Correspondence for Speaker Normalization},
 doi={10.21437/Interspeech.2007-120},
 booktitle=interspeech,
 pages={274--277},
 address={Antwerp},
 month={August},
 year={2007},
 keywords={recognition}
}

@inproceedings{borys2005distinctive,
 author={Sarah Borys and Mark Hasegawa-Johnson},
 title={Distinctive Feature Based {SVM} Discriminant Features for Improvements to Phone Recognition on Telephone Band Speech},
 doi={10.21437/Interspeech.2005-200},
 booktitle=interspeech,
 month={October},
 year={2005},
 grant={NSF 0132900},
 keywords={recognition}
}

@phdthesis{zheng2005feature,
  author   = {Yanli Zheng},
  title    = {Acoustic Modeling and Feature Extraction for Speech Recognition},
  school   = {University of Illinois},
  year     = {2005},
  url      = {https://www.ideals.illinois.edu/items/82196},
  keywords = {recognition}
}

@inproceedings{hasegawajohnson2004experiments,
  author    = {Mark Hasegawa-Johnson and Sarah Borys and Ken Chen},
  title     = {Experiments in Landmark-Based Speech Recognition},
  booktitle = {Sound to Sense: Workshop in Honor of Kenneth N. Stevens},
  month     = {June},
  year      = {2004},
  grant     = {NSF 0132900},
  keywords  = {recognition}
}

@unpublished{geirhofer2004feature,
  author   = {Stefan Geirhofer},
  title    = {Feature Reduction with Linear Discriminant Analysis and its Performance on Phoneme Recognition},
  note     = {Undergraduate research project},
  year     = {2004},
  keywords = {recognition}
}

@phdthesis{omar2003acoustic,
  author   = {Mohamed Kamal Mahmoud Omar},
  title    = {Acoustic Feature Design for Speech Recognition: A Statistical Information-Theoretic Approach},
  school   = {University of Illinois},
  year     = {2003},
  url      = {https://www.ideals.illinois.edu/items/82130},
  keywords = {recognition}
}

@article{omar2003approximately,
 author={Mohammed Kamal Omar and Mark Hasegawa-Johnson},
 title={Approximately Independent Factors of Speech Using Nonlinear Symplectic Transformation},
 doi={10.1109/TSA.2003.814457},
 journal={IEEE Transactions on Speech and Audio Processing},
 volume={11},
 number={6},
 pages={660--671},
 year={2003},
 grant={NSF 0132900},
 keywords={recognition}
}

@inproceedings{omar2003ccct,
  author    = {Mohammed Kamal Omar and Mark Hasegawa-Johnson},
  title     = {Non-Linear Independent Component Analysis for Speech Recognition},
  booktitle = {International Conference on Computer, Communication and Control Technologies (CCCT '03)},
  year      = {2003},
  url       = {https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=d95f5f7198a3463efa9490533550de5ec02234e2},
  grant     = {NSF 0132900},
  keywords  = {recognition}
}

@inproceedings{omar2003strong-sense,
 author={Mohammed Kamal Omar and Mark Hasegawa-Johnson},
 title={Strong-Sense Class-Dependent Features for Statistical Recognition},
 doi={10.1109/SSP.2003.1289454},
 booktitle={IEEE Workshop on Statistical Signal Processing},
 address={St. Louis, MO},
 year={2003},
 pages={473--476},
 grant={NSF 0132900},
 keywords={recognition}
}

@inproceedings{omar2003maximum,
 author={Mohammed Kamal Omar and Mark Hasegawa-Johnson},
 title={Maximum Conditional Mutual Information Projection For Speech Recognition},
 booktitle=interspeech,
 month={September},
 year={2003},
 pages={505--508},
 doi={10.21437/Eurospeech.2003-181},
 grant={NSF 0132900},
 keywords={recognition}
}

@inproceedings{omar2003interspeech,
 author={Mohammed Kamal Omar and Mark Hasegawa-Johnson},
 title={Non-Linear Maximum Likelihood Feature Transformation For Speech Recognition},
 doi={10.21437/Eurospeech.2003-685},
 booktitle=interspeech,
 month={September},
 year={2003},
 pages={2497--2500},
 grant={NSF 0132900},
 keywords={recognition}
}

@article{hasegawajohnson2002finding,
 author={Mark Hasegawa-Johnson},
 title={Finding the Best Acoustic Measurements for Landmark-Based Speech Recognition},
 journal={Accumu Magazine},
 publisher={Kyoto Computer Gakuin},
 address={Kyoto, Japan},
 year={2002},
 volume={11},
 pages={45--47},
 grant={NSF 0132900},
 keywords={recognition}
}

@inproceedings{omar2002evaluation,
 author={Mohammed Kamal Omar and Ken Chen and Mark Hasegawa-Johnson and Yigal Brandman},
 title={An Evaluation of using Mutual Information for Selection of Acoustic-Features Representation of Phonemes for Speech Recognition},
 booktitle=interspeech,
 address={Denver, CO},
 month={September},
 year={2002},
 pages={2129--2132},
 doi={10.21437/ICSLP.2002-582},
 keywords={recognition}
}

@inproceedings{jing2002auditory-modeling,
 author={Zhinian Jing and Mark Hasegawa-Johnson},
 title={Auditory-Modeling Inspired Methods of Feature Extraction for Robust Automatic Speech Recognition},
 doi={10.1109/ICASSP.2002.5745632},
 booktitle=icassp,
 month={May},
 year={2002},
 pages={IV:4176},
 grant={NSF 0132900},
 keywords={recognition}
}

@inproceedings{omar2002maximum,
 author={Mohammed Kamal Omar and Mark Hasegawa-Johnson},
 title={Maximum Mutual Information Based Acoustic Features Representation of Phonological Features for Speech Recognition},
 doi={10.1109/ICASSP.2002.5743659},
 booktitle=icassp,
 month={May},
 year={2002},
 pages={I:81--84},
 keywords={recognition}
}

@inproceedings{gunawan2001plp,
 author={Wira Gunawan and Mark Hasegawa-Johnson},
 title={{PLP} Coefficients can be Quantized at 400 bps},
 doi={10.1109/ICASSP.2001.940771},
 booktitle=icassp,
 address={Salt Lake City, UT},
 pages={2.2.1-4},
 year={2001},
 keywords={recognition}
}

@inproceedings{wang2022self,
 author={Liming Wang and Siyuan Feng and Mark A. Hasegawa-Johnson and Chang D. Yoo},
 title={Self-supervised Semantic-driven Phoneme Discovery for Zero-resource Speech Recognition},
 doi={10.18653/v1/2022.acl-long.553},
 booktitle={ACL},
 year={2022},
 month={5},
 pages={8027--8047},
 keywords={recognition}
}

@article{zelasko2021discovering,
 author={Piotr Zelasko and Siyuan Feng and Laureano Moro-Velazquez and Ali Abavisani and Saurabchand Bhati and Odette Scharenborg and Mark Hasegawa-Johnson and Najim Dehak},
 title={Discovering Phonetic Inventories with Crosslingual Automatic Speech Recognition},
 journal={Computer Speech and Language},
 year={2022},
 month={7},
 volume={74},
 pages={101358:1--54},
 keywords={recognition},
 doi={10.1016/j.csl.2022.101358},
}

@inproceedings{feng2021how,
 author={Siyuan Feng and Piotr Żelasko and Laureano Moro-Velázquez and Ali Abavisani and Mark Hasegawa-Johnson and Odette Scharenborg and Najim Dehak},
 title={How Phonotactics Affect Multilingual and Zero-shot {ASR} Performance},
 doi={10.1109/ICASSP39728.2021.9414478},
 booktitle=icassp,
 year={2021},
 pages={7238--7242},
 keywords={recognition}
}

@inproceedings{jyothi15_interspeech,
 author={Preethi Jyothi and Mark Hasegawa-Johnson},
 title={Transcribing continuous speech using mismatched crowdsourcing},
 year={2015},
 booktitle=interspeech,
 pages={2774--2778},
 doi={10.21437/Interspeech.2015-584}
}

@inproceedings{jyothi2015improving,
 author={Preethi Jyothi and Mark Hasegawa-Johnson},
 title={Improving {Hindi} Broadcast {ASR} by Adapting the Language Model and Pronunciation Model Using A Priori Syntactic and Morphophonemic Knowledge},
 booktitle=interspeech,
 year={2015},
 pages={3164--3168},
 keywords={recognition},
 doi={10.21437/Interspeech.2015-637}
}

@inproceedings{abunasser2013pronunciation,
 author={Mahmoud Abunasser and Abbas Benmamoun and Mark Hasegawa-Johnson},
 title={Pronunciation Variation Metric for Four Dialects of {Arabic}},
 booktitle={AIDA 10 (Association Internationale de Dialectologie Arabe)},
 address={Qatar University},
 year={2013},
 keywords={recognition}
}

@article{elmahdy2012ijcl,
 author={Mohamed Elmahdy and Mark Hasegawa-Johnson and Eiman Mustafawi},
 title={Hybrid Phonemic and Graphemic Modeling for {Arabic} Speech Recognition},
 url={https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=78b19225125b6be20ed942ea380ed7d8657c71dd},
 journal={International Journal of Computational Linguistics},
 volume={3},
 number={1},
 pages={88--96},
 issn={2180-1266},
 grant={QNRF NPRP 09-410-1-069},
 year={2012},
 keywords={recognition}
}

@inproceedings{elmahdy2012qnrf,
 author={Mohamed Elmahdy and Mark Hasegawa-Johnson and Eiman Mustafawi},
 title={Hybrid Pronunciation Modeling for {Arabic} Large Vocabulary Speech Recognition},
 doi={10.5339/qfarf.2012.CSO3},
 booktitle={Qatar Foundation Annual Research Forum},
 year={2012},
 grant={QNRF NPRP 09-410-1-069},
 keywords={recognition}
}

@inproceedings{kantor2011hmm-based,
 author={Arthur Kantor and Mark Hasegawa-Johnson},
 title={{HMM}-based Pronunciation Dictionary Generation},
 url={https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=66a415c3c988807ed959fc159fd95786ee8f0029},
 booktitle={Workshop on New Tools and Methods for Very Large Scale Phonetics Research},
 address={University of Pennsylvania},
 month={Jan.},
 year={2011},
 grant={NSF 0703624},
 software={http://mickey.ifp.illinois.edu/speechWiki/index.php/Phonetic_Transcription_Tool},
 keywords={recognition}
}

@phdthesis{kantor2010pronunciation,
  author   = {Arthur Kantor},
  title    = {Pronunciation modeling for large vocabulary speech recognition},
  school   = {University of Illinois},
  year     = {2010},
  url      = {https://www.ideals.illinois.edu/items/18366},
  software = {http://mickey.ifp.illinois.edu/speechWiki/index.php/GMTK_parallel_tools},
  keywords = {recognition}
}

@inproceedings{hu2010interspeech,
 author={Chi Hu and Xiaodan Zhuang and Mark Hasegawa-Johnson},
 title={{FSM}-Based Pronunciation Modeling using Articulatory Phonological Code},
 booktitle=interspeech,
 year={2010},
 pages={2274--2277},
 doi={10.21437/Interspeech.2010-624},
 grant={NSF 0703624},
 keywords={recognition}
}

@inproceedings{nam2010a,
 author={Hosung Nam and Vikramjit Mitra and Mark Tiede and Elliot Saltzman and Louis Goldstein and Carol Espy-Wilson and Mark Hasegawa-Johnson},
 title={A procedure for estimating gestural scores from natural speech},
 pages={30--33},
 doi={10.21437/Interspeech.2010-4},
 booktitle=interspeech,
 year={2010},
 grant={NSF 0703624},
 keywords={recognition}
}

@inproceedings{chen2004modeling,
 author={Ken Chen and Mark Hasegawa-Johnson},
 title={Modeling pronunciation variation using artificial neural networks for {English} spontaneous speech},
 booktitle=interspeech,
 month={October},
 doi={10.21437/Interspeech.2004-557},
 year={2004},
 pages={400--403},
 grant={NSF 0414117},
 keywords={recognition}
}

@inproceedings{xu2023dual,
 author={Zhongweiyang Xu and Xulin Fan and Mark Hasegawa-Johnson},
 title={Dual-Path Cross-Modal Attention for better Audio-Visual Speech Extraction},
 booktitle=icassp,
 year={2023},
 note={Recognized as one of the top 3\% of papers at the conference},
 url={https://drive.google.com/file/d/1IHK4EWuOiBX11fA7mdzUHIhCWK5ahOwf/view},
 doi={10.1109/ICASSP49357.2023.10096732},
 keywords={recognition}
}

@inproceedings{van2020evaluating,
 author={Justin van der Hout and Mark Hasegawa-Johnson and Odette Scharenborg},
 title={Evaluating Automatically Generated Phoneme Captions for Images},
 url={https://arxiv.org/abs/2007.15916},
 booktitle=interspeech,
 year={2020},
 keywords={recognition},
 pages={2317--2321},
 doi={10.21437/Interspeech.2020-2870}
}

@inproceedings{wang2020a,
 author={Liming Wang and Mark Hasegawa-Johnson},
 title={A {DNN-HMM-DNN} Hybrid Model for Discovering Word-Like Units from Spoken Captions and Image Regions},
 booktitle=interspeech,
 year={2020},
 keywords={recognition},
 pages={1456--1460},
 doi={10.21437/Interspeech.2020-1148}
}

@article{wang2020multimodal,
 author={Liming Wang and Mark Hasegawa-Johnson},
 title={Multimodal word discovery and retrieval with spoken descriptions and visual concepts},
 journal={IEEE/ACM Transactions on Audio, Speech, and Language Processing},
 volume={28},
 pages={1560--1573},
 year={2020},
 doi={10.1109/TASLP.2020.2996082},
 keywords={recognition}
}

@article{scharenborg2021international,
 author={Odette Scharenborg and Mark Hasegawa-Johnson},
 title={Position Paper: Brain Signal-based Dialogue Systems},
 doi={10.1007/978-981-15-9323-9_36},
 journal={Lecture Notes in Electrical Engineering},
 volume={714},
 year={2021},
 month={3},
 editor={Marchi, E. and Siniscalchi, S. M. and Cumani, S. and Salerno, V. M. and Li, H.},
 keywords={recognition}
}

@inproceedings{sari2018interspeech,
 author={Leda Sari and Mark Hasegawa-Johnson and S. Kumaran and Georg Stemmer and N. Nair Krishnakumar},
 title={Speaker Adaptive Audio-Visual Fusion for the Open-Vocabulary Section of {AVICAR}},
 booktitle=interspeech,
 year={2018},
 pages={3524--3528},
 doi={10.21437/Interspeech.2018-2359},
 keywords={recognition}
}

@inproceedings{bharadwaj2012multi-view,
  author    = {Sujeeth Bharadwaj and Raman Arora and Karen Livescu and Mark Hasegawa-Johnson},
  title     = {Multi-View Acoustic Feature Learning Using Articulatory Measurements},
  booktitle = {IWSML (Internat. Worksh. on Statistical Machine Learning for Sign. Process.)},
  year      = {2012},
  url       = {https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=2106a2dce0f7c3ea611499ed93187dcee841fc16},
  grant     = {NSF 0905633},
  keywords  = {recognition}
}

@inproceedings{hasegawajohnson2007multi-stream,
 author={Mark Hasegawa-Johnson},
 title={Multi-Stream Approach to Audiovisual Automatic Speech Recognition},
 doi={10.1109/MMSP.2007.4412884},
 booktitle={IEEE 9th Workshop on Multimedia Signal Processing (MMSP)},
 pages={328--331},
 year={2007},
 keywords={recognition}
}

@inproceedings{hasegawajohnson2007audiovisual,
 author={Mark Hasegawa-Johnson and Karen Livescu and Partha Lal and Kate Saenko},
 title={Audiovisual Speech Recognition with Articulator Positions as Hidden Variables},
 url={https://www.researchgate.net/profile/K-Livescu/publication/228926670_Audiovisual_speech_recognition_with_articulator_positions_as_hidden_variables/links/00b7d5201284197994000000/Audiovisual-speech-recognition-with-articulator-positions-as-hidden-variables.pdf},
 booktitle={Proc. International Congress on Phonetic Sciences (ICPhS)},
 pages={1719:297--302},
 address={Saarbrücken},
 month={August},
 year={2007},
 grant={NSF 0121285},
 keywords={recognition}
}

@unpublished{hasegawajohnson2007audio-visual,
  author   = {Mark Hasegawa-Johnson},
  title    = {Audio-Visual Speech Recognition: Audio Noise, Video Noise, and Pronunciation Variability},
  note     = {talk given to the Signal Processing Society, IEEE Japan},
  month    = {June},
  year     = {2007},
  grant    = {NSF 0534106},
  keywords = {recognition}
}

@inproceedings{fu2007lipreading,
 author={Yun Fu and Xi Zhou and Ming Liu and Mark Hasegawa-Johnson and Thomas S. Huang},
 title={Lipreading by Locality Discriminant Graph},
 doi={10.1109/ICIP.2007.4379312},
 booktitle={IEEE International Conference on Image Processing (ICIP)},
 pages={III:325--328},
 year={2007},
 grant={NSF 0426627},
 keywords={recognition}
}

@inproceedings{livescu2007articulatory,
 author={Karen Livescu and Ozgur Cetin and Mark Hasegawa-Johnson and Simon King and Chris Bartels and Nash Borges and Arthur Kantor and Partha Lal and Lisa Yung and Ari Bezman and Stephen Dawson-Haggerty and Bronwyn Woods and Joe Frankel and Mathew Magimai-Doss and Kate Saenko},
 title={Articulatory Feature-Based Methods for Acoustic and Audio-Visual Speech Recognition: Summary from the 2006 {JHU} Summer Workshop},
 doi={10.1109/ICASSP.2007.366989},
 booktitle=icassp,
 month={May},
 year={2007},
 pages={621--624},
 keywords={recognition}
}

@unpublished{livescu2007articulatory-feature-based,
 author={Karen Livescu and Özgür Çetin and Mark Hasegawa-Johnson and Simon King and Chris Bartels and Nash Borges and Arthur Kantor and Partha Lal and Lisa Yung and Ari Bezman and Stephen Dawson-Haggerty and Bronwyn Woods and Joe Frankel and Mathew Magimai-Doss and Kate Saenko},
 title={Articulatory-Feature-Based Methods for Acoustic and Audio-Visual Speech Recognition: 2006 {JHU} Summer Workshop Final Report},
 note={Final report of the WS06 Johns Hopkins Summer Workshop team},
 year={2007},
 keywords={recognition}
}

@unpublished{hasegawajohnson2006object,
 author={Mark Hasegawa-Johnson},
 title={Object Tracking and Asynchrony in Audio-Visual Speech Recognition},
 note={talk given to the Artificial Intelligence, Vision, and Robotics seminar series},
 month={August},
 year={2006},
 grant={NSF 0534106},
 keywords={recognition}
}

@inproceedings{hasegawajohnson2006dealing,
 author={Mark Hasegawa-Johnson},
 title={Dealing with Acoustic Noise. Part {III}: Video},
 booktitle={tutorial presentation given at WS06, Center for Language and Speech Processing},
 month={July},
 year={2006},
 grant={NSF 0121285},
 keywords={recognition}
}

@unpublished{goudeseune2006avicar,
 author={Camille Goudeseune and Bowon Lee},
 title={{AVICAR}: Audio-Visual Speech Recognition in a Car Environment},
 note={Promotional Film},
 year={2006},
 grant={Motorola RPS19},
 keywords={recognition}
}

@inproceedings{lee2004avicar,
 author={Bowon Lee and Mark Hasegawa-Johnson and Camille Goudeseune and Suketu Kamdar and Sarah Borys and Ming Liu and Thomas Huang},
 title={{AVICAR}: Audio-Visual Speech Corpus in a Car Environment},
 booktitle=interspeech,
 month={October},
 year={2004},
 pages={380--383},
 grant={Motorola RPS19},
 doi={10.21437/Interspeech.2004-424},
 keywords={recognition}
}

@inproceedings{levinson2002multimodal,
 author={Stephen E. Levinson and Thomas S. Huang and Mark A. Hasegawa-Johnson and Ken Chen and Stephen Chu and Ashutosh Garg and Zhinian Jing and Danfeng Li and J. Lin and Mohammed Kamal Omar and Z. Wen},
 title={Multimodal Dialog Systems Research at {Illinois}},
 url={https://apps.dtic.mil/sti/pdfs/ADA415344.pdf#page=39},
 booktitle={ARPA Workshop on Multimodal Speech Recognition and SPINE},
 month={June},
 year={2002},
 grant={NSF 0132900},
 keywords={recognition}
}

@inproceedings{hasegawajohnson2020multimodal,
  author    = {Mark Hasegawa-Johnson},
  title     = {Multimodal Distant Supervision},
  booktitle = {NeurIPS Workshop on Self-Supervised Learning for Speech and Audio},
  url       = {https://slideslive.com/38938462/multimodal-distant-supervision},
  year      = {2020}
}

@inproceedings{gao22e_interspeech,
  author={Heting Gao and Junrui Ni and Kaizhi Qian and Yang Zhang and Shiyu Chang and Mark Hasegawa-Johnson},
  title={{WavPrompt}: Towards Few-Shot Spoken Language Understanding with Frozen Language Models},
  year=2022,
  booktitle=interspeech,
  pages={2738--2742},
  doi={10.21437/Interspeech.2022-11031}
}

@inproceedings{sari2020training,
 author={Leda Sar{\i} and Samuel Thomas and Mark Hasegawa-Johnson},
 title={Training Spoken Language Understanding Systems with Non-Parallel Speech and Text},
 doi={10.1109/ICASSP40776.2020.9054664},
 booktitle=icassp,
 year={2020},
 pages={8109--8113},
 keywords={recognition}
}

@inproceedings{wang2023a,
  author    = {Liming Wang and Mark Hasegawa-Johnson and Chang D. Yoo},
  title     = {A Theory of Unsupervised Speech Recognition},
  booktitle = {ACL},
  month     = {7},
  year      = {2023},
  url       = {https://arxiv.org/abs/2306.07926},
  keywords  = {recognition}
}

@inproceedings{wu2024just,
 title={Just {ASR} + {LLM}? A Study on Speech Large Language Models' Ability to Identify and Understand Speaker in Spoken Dialogue},
 url={https://arxiv.org/abs/2409.04927},
 author={Junkai Wu and Xulin Fan and Bo-Ru Lu and Xilin Jiang and Nima Mesgarani and Mark Hasegawa-Johnson and Mari Ostendorf},
 booktitle=slt,
 year={2024},
 month={12}
 }
 
@inproceedings{wang2023speak,
  author    = {Liming Wang and Junrui Ni and Heting Gao and Jialu Li and Kai Chieh Chang and Xulin Fan and Junkai Wu and Mark Hasegawa-Johnson and Chang D. Yoo},
  title     = {Speak and Decipher and Sign: Toward Unsupervised Speech-to-Sign Language Recognition},
  booktitle = {Findings of ACL},
  month     = {7},
  year      = {2023},
  url       = {https://aclanthology.org/2023.findings-acl.424/},
  keywords  = {recognition}
}

@inproceedings{wang2021align,
 author={Liming Wang and Xinsheng Wang and Mark Hasegawa-Johnson and Odette Scharenborg and Najim Dehak},
 title={Align or Attend? Toward More Efficient and Accurate Spoken Word Discovery Using Speech-to-Image Retrieval},
 doi={10.1109/ICASSP39728.2021.9414418},
 booktitle=icassp,
 year={2021},
 keywords={recognition}
}

@inproceedings{wang2019multimodal,
 author={Liming Wang and Mark A. Hasegawa-Johnson},
 title={Multimodal Word Discovery and Retrieval with Phone Sequence and Image Concepts},
 booktitle=interspeech,
 year={2019},
 keywords={recognition},
 pages={2683--2687},
 doi={10.21437/Interspeech.2019-1487}
}

@inproceedings{hasegawajohnson2019position,
  author    = {Mark Hasegawa-Johnson and Najim Dehak and Odette Scharenborg},
  title     = {Position Paper: Indirect Supervision for Dialog Systems in Unwritten Languages},
  booktitle = {International Workshop on Spoken Dialog Systems},
  year      = {2019},
  url       = {https://research.tudelft.nl/files/83277474/IWSDS_2019_Mark.pdf},
  keywords  = {recognition}
}

@inproceedings{scharenborg2018building,
 author={Odette Scharenborg and Patrick Ebel and Francesco Ciannella and Mark Hasegawa-Johnson and Najim Dehak},
 title={Building an {ASR} System for {Mboshi} Using a Cross-language Definition of Acoustic Units Approach},
 booktitle={Proc. SLTU (Speech and Language Technology for Under-resourced languages)},
 year={2018},
 keywords={recognition},
 pages={167--171},
 doi={10.21437/SLTU.2018-35}
}

@inproceedings{scharenborg2018linguistic,
 author={Odette Scharenborg and Laurent Besacier and Alan Black and Mark Hasegawa-Johnson and Florian Metze and Graham Neubig and Sebastian Stüker and Pierre Godard and Markus Müller and Lucas Ondel and Shruti Palaskar and Philip Arthur and Francesco Ciannella and Mingxing Du and Elin Larsen and Danny Merkx and Rachid Riad and Liming Wang and Emmanuel Dupoux},
 title={Linguistic Unit Discovery from Multi-Modal Inputs in Unwritten Languages: Summary of the {Speaking Rosetta} {JSALT} 2017 Workshop},
 doi={10.1109/ICASSP.2018.8461761},
 booktitle=icassp,
 year={2018},
 keywords={recognition}
}

@inproceedings{chen2018topic,
 author={Wenda Chen and Mark Hasegawa-Johnson and Nancy F. Y. Chen},
 title={Topic and Keyword Identification for Low-resourced Speech Using Cross-Language Transfer Learning},
 booktitle=interspeech,
 year={2018},
 pages={2047--2051},
 doi={10.21437/Interspeech.2018-1283},
 keywords={recognition}
}

@inproceedings{hasegawajohnson2017image2speech:,
  author    = {Mark Hasegawa-Johnson and Alan Black and Lucas Ondel and Odette Scharenborg and Francesco Ciannella},
  title     = {Image2speech: Automatically generating audio descriptions of images},
  booktitle = {Proc. Internat. Conference on Natural Language, Signal and Speech Processing (ICNLSSP)},
  address   = {Casablanca, Morocco},
  year      = {2017},
  url       = {https://www.researchgate.net/profile/Kamel-Smaili-2/publication/354700462_INTERNATIONAL_CONFERENCE_ON_NATURAL_LANGUAGE_SIGNAL_AND_SPEECH_PROCESSING_Casablanca_2017_Morocco_Sponsor_ICNLSSP_International_Conference_on_Natural_Language_Signal_and_Speech_Processing/links/6148a03ea595d06017dd226b/INTERNATIONAL-CONFERENCE-ON-NATURAL-LANGUAGE-SIGNAL-AND-SPEECH-PROCESSING-Casablanca-2017-Morocco-Sponsor-ICNLSSP-International-Conference-on-Natural-Language-Signal-and-Speech-Processing.pdf#page=66},
  keywords  = {recognition}
}

@inproceedings{zhuang2009speech,
 author={Xiaodan Zhuang and Jui-Ting Huang and Mark Hasegawa-Johnson},
 title={Speech Retrieval in Unknown Languages: a Pilot Study},
 url={https://aclanthology.org/W09-1602.pdf},
 booktitle={NAACL HLT Cross-Lingual Information Access Workshop (CLIAWS)},
 pages={3--11},
 year={2009},
 grant={NSF 0703624},
 keywords={recognition}
}

@incollection{chen2007a,
 author={Ken Chen and Mark Hasegawa-Johnson and Jennifer Cole},
 title={A Factored Language Model for Prosody-Dependent Speech Recognition},
 url={http://www.intechopen.com/books/show/title/robust_speech_recognition_and_understanding},
 booktitle={Robust Speech Recognition and Understanding},
 editor={Michael Grimm and Kristian Kroschel},
 publisher={INTECH Publishing},
 pages={319--332},
 year={2007},
 keywords={recognition}
}

@article{hasegawajohnson2008prosodically,
 author={Mark Hasegawa-Johnson and Jennifer Cole and Ken Chen and Partha Lal and Amit Juneja and Taejin Yoon and Sarah Borys and Xiaodan Zhuang},
 title={Prosodically Organized Automatic Speech Recognition},
 journal={Language and Linguistics Monograph Series},
 volume={A25},
 publisher={Academia Sinica},
 address={Taiwan},
 year={2008},
 pages={101--128},
 grant={NSF 0414117},
 keywords={recognition}
}

@unpublished{hasegawajohnson2006phonology,
  author   = {Mark Hasegawa-Johnson},
  title    = {Phonology and the Art of Automatic Speech Recognition},
  year     = {2006},
  month    = {November},
  note     = {Director's Seminar Series, Beckman Institute, University of Illinois at Urbana-Champaign},
  grant    = {NSF 0414117},
  keywords = {recognition}
}

@article{yoon2008voice,
 author={Taejin Yoon and Xiaodan Zhuang and Jennifer Cole and Mark Hasegawa-Johnson},
 title={Voice Quality Dependent Speech Recognition},
 journal={Language and Linguistics Monograph Series},
 volume={A25},
 publisher={Academia Sinica},
 address={Taiwan},
 year={2008},
 pages={77--100},
 grant={NSF 0414117},
 keywords={recognition}
}

@article{chen2006prosody,
 author={Ken Chen and Mark Hasegawa-Johnson and Aaron Cohen and Sarah Borys and Sung-Suk Kim and Jennifer Cole and Jeung-Yoon Choi},
 title={Prosody Dependent Speech Recognition on Radio News Corpus of {American English}},
 doi={10.1109/TSA.2005.853208},
 journal={IEEE Transactions on Speech and Audio Processing},
 volume={14},
 number={1},
 pages={232--245},
 year={2006},
 grant={NSF 0132900},
 keywords={recognition}
}

@article{hasegawajohnson2005simultaneous,
 author={Mark Hasegawa-Johnson and Ken Chen and Jennifer Cole and Sarah Borys and Sung-Suk Kim and Aaron Cohen and Tong Zhang and Jeung-Yoon Choi and Heejin Kim and Taejin Yoon and Sandra Chavarria},
 title={Simultaneous Recognition of Words and Prosody in the {Boston University Radio Speech Corpus}},
 doi={10.1016/j.specom.2005.01.009},
 journal=jsc,
 volume={46},
 number={3--4},
 pages={418--439},
 year={2005},
 grant={NSF 0132900},
 keywords={recognition}
}

@inproceedings{zhang2005a,
 author={Tong Zhang and Mark Hasegawa-Johnson and Stephen E. Levinson},
 title={A Hybrid Model for Spontaneous Speech Understanding},
 url={https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=8110962ce5089070665624355945933b54b7e8eb},
 booktitle=aaai,
 year={2005},
 pages={10.1.1.80.879:1--8},
 grant={NSF 0085980},
 keywords={recognition}
}

@inproceedings{ren2004semantic,
 author={Yuexi Ren and Mark Hasegawa-Johnson and Stephen E. Levinson},
 title={Semantic analysis for a speech user interface in an intelligent-tutoring system},
 doi={10.1145/964442.964516},
 booktitle={Intl. Conf. on Intelligent User Interfaces},
 address={Madeira, Portugal},
 year={2004},
 grant={NSF 0085980},
 keywords={recognition}
}

@inproceedings{borys2004modeling,
  author    = {Sarah Borys and Mark Hasegawa-Johnson and Ken Chen and Aaron Cohen},
  title     = {Modeling and Recognition of Phonetic and Prosodic Factors for Improvements to Acoustic Speech Recognition Models},
  booktitle = interspeech,
  pages     = {3013--3016},
  month     = {October},
  year      = {2004},
  doi       = {10.21437/Interspeech.2004-756},
  grant     = {NSF 0132900},
  keywords  = {recognition}
}

@phdthesis{chen2004prosody,
 author={Ken Chen},
 title={Prosody Dependent Speech Recognition on {American} Radio News Speech},
 url={https://www.ideals.illinois.edu/items/82155},
 year={2004},
 school={University of Illinois},
 keywords={recognition}
}

@unpublished{hasegawajohnson2004tsinghua,
 author={Mark Hasegawa-Johnson},
 title={Speech Recognition Models of the Interdependence Among Syntax, Prosody, and Segmental Acoustics},
 note={talk given at Tsinghua University},
 month={October},
 year={2004},
 grant={NSF 0414117},
 keywords={recognition}
}

@inproceedings{hasegawajohnson2004hlt,
 author={Mark Hasegawa-Johnson and Jennifer Cole and Chilin Shih and Ken Chen and Aaron Cohen and Sandra Chavarria and Heejin Kim and Taejin Yoon and Sarah Borys and Jeung-Yoon Choi},
 title={Speech Recognition Models of the Interdependence Among Syntax, Prosody, and Segmental Acoustics},
 url={https://aclanthology.org/W04-3010/},
 booktitle={HLT/NAACL Workshop on Higher-Level Knowledge in Automatic Speech Recognition and Understanding},
 month={May},
 year={2004},
 pages={56--63},
 grant={NSF 0414117},
 keywords={recognition}
}

@inproceedings{chen2004how,
 author={Ken Chen and Mark Hasegawa-Johnson},
 title={How Prosody Improves Word Recognition},
 url={https://www.isca-speech.org/archive/speechprosody_2004/chen04c_speechprosody.html},
 booktitle={Speech Prosody},
 year={2004},
 address={Nara, Japan},
 month={March},
 pages={583--586},
 grant={NSF 0132900},
 keywords={recognition}
}

@inproceedings{chen2003wssp,
 author={Ken Chen and Mark Hasegawa-Johnson and Jennifer Cole},
 title={Prosody Dependent Speech Recognition on Radio News},
 booktitle={IEEE Workshop on Statistical Signal Processing},
 address={St. Louis, MO},
 year={2003},
 keywords={recognition}
}

@inproceedings{chen2003prosody,
 author={Ken Chen and Mark Hasegawa-Johnson and Aaron Cohen and Sarah Borys and Jennifer Cole},
 title={Prosody Dependent Speech Recognition with Explicit Duration Modelling at Intonational Phrase Boundaries},
 booktitle=interspeech,
 month={September},
 year={2003},
 pages={393--396},
 doi={10.21437/Eurospeech.2003-153},
 software={http://isle.illinois.edu/speech_web_lg/software/2003/Durhmm3.0.zip},
 keywords={recognition}
}

@unpublished{borys2003recognition,
  author   = {Sarah Borys},
  title    = {Recognition of Prosodic Factors and Detection of Landmarks for Improvements to Continuous Speech Recognition Systems},
  year     = {2003},
  note     = {B.S. Thesis, University of Illinois},
  keywords = {recognition}
}

@inproceedings{sari2020deep,
 author={Leda Sar{\i} and Mark Hasegawa-Johnson},
 booktitle=interspeech,
 year={2020},
 keywords={recognition},
  title={Deep {F-Measure} Maximization for End-to-End Speech Understanding},
  pages={1580--1584},
  doi={10.21437/Interspeech.2020-1949}
}

@inproceedings{borys2003the,
  author    = {Sarah Borys and Mark Hasegawa-Johnson and Jennifer Cole},
  title     = {The Importance of Prosodic Factors in Phoneme Modeling with Applications to Speech Recognition},
  booktitle = {ACL Student Session},
  year      = {2003},
  grant     = {NSF 0132900},
  keywords  = {recognition}
}

@article{borys2003prosody,
  author   = {Sarah Borys and Mark Hasegawa-Johnson and Jennifer Cole},
  title    = {Prosody as a Conditioning Variable in Speech Recognition},
  journal  = {Illinois Journal of Undergraduate Research},
  year     = {2003},
  url      = {https://www.researchgate.net/profile/Jennifer-Cole-6/publication/2842059_Prosody_As_A_Conditioning_Variable_In_Speech_Recognition/links/0912f50aa6042dd0bd000000/Prosody-As-A-Conditioning-Variable-In-Speech-Recognition.pdf},
  keywords = {recognition}
}

@article{hasegawajohnson2017asr,
 author={Mark Hasegawa-Johnson and Preethi Jyothi and Daniel McCloy and Majid Mirbagheri and Giovanni di Liberto and Amit Das and Bradley Ekin and Chunxi Liu and Vimal Manohar and Hao Tang and Edmund C. Lalor and Nancy Chen and Paul Hager and Tyler Kekona and Rose Sloan and Adrian KC Lee},
 title={{ASR} for Under-Resourced Languages from Probabilistic Transcription},
 journal={IEEE/ACM Transactions on Audio, Speech, and Language Processing},
 volume={25},
 number={1},
 pages={46--59},
 year={2017},
 issn={2329-9290},
 doi={10.1109/TASLP.2016.2621659},
 keywords={recognition}
}

@inproceedings{chen2016clustering-based,
 author={Wenda Chen and Mark Hasegawa-Johnson and Nancy Chen and Preethi Jyothi and Lav Varshney},
 title={Clustering-based Phonetic Projection in Mismatched Crowdsourcing Channels for Low-resourced {ASR}},
 url={https://www.aclweb.org/anthology/W16-3714/},
 booktitle={WSSANLP (Workshop on South and Southeast Asian Natural Language Processing)},
 year={2016},
 pages={133--141},
 keywords={recognition}
}

@unpublished{hasegawajohnson2015probabilistic,
 author={Mark Hasegawa-Johnson and Edmund C. Lalor and Adrian KC Lee and Preethi Jyothi and Majid Mirbagheri and Amit Das and Giovanni di Liberto and Bradley Ekin and Chunxi Liu and Vimal Manohar and Hao Tang and Paul Hager and Tyler Kekona and Rose Sloan},
 title={Probabilistic Transcription},
 note={WS15 Group Final Presentation},
 year={2015},
 keywords={recognition}
}

@inproceedings{jyothi2015transcribing,
 author={Preethi Jyothi and Mark Hasegawa-Johnson},
 title={Transcribing Continuous Speech Using Mismatched Crowdsourcing},
 booktitle=interspeech,
 year={2015},
 pages={2774--2778},
 keywords={recognition},
 doi={10.21437/Interspeech.2015-584}
}

@article{hasegawajohnson2015models,
 author={Mark Hasegawa-Johnson and Jennifer Cole and Preethi Jyothi and Lav Varshney},
 title={Models of Dataset Size, Question Design, and Cross-Language Speech Perception for Speech Crowdsourcing Applications},
 doi={10.1515/lp-2015-0012},
 journal={Laboratory Phonology},
 volume={6},
 number={3--4},
 pages={381--431},
 year={2015},
 keywords={recognition}
}

@inproceedings{jyothi2015acquiring,
 author={Preethi Jyothi and Mark Hasegawa-Johnson},
 title={Acquiring Speech Transcriptions Using Mismatched Crowdsourcing},
 doi={10.1609/aaai.v29i1.9343},
 booktitle={Proc. AAAI},
 year={2015},
 pages={1263--1269},
 keywords={recognition}
}

@unpublished{hasegawajohnson2012transfer,
 author={Mark Hasegawa-Johnson and David Harwath and Harsh Vardhan Sharma and Po-Sen Huang},
 title={Transfer Learning for Multi-Person and Multi-Dialect Spoken Language Interface},
 note={presentation given at the 2012 Urbana Neuroengineering Conference},
 year={2012},
 keywords={recognition}
}

@inproceedings{huang2010semi-supervised,
 author={Jui-Ting Huang and Mark Hasegawa-Johnson},
 title={Semi-Supervised Training of {Gaussian} Mixture Models by Conditional Entropy Minimization},
 booktitle=interspeech,
 year={2010},
 pages={1353--1356},
 grant={NSF 0703624},
 keywords={recognition}
}

@inproceedings{ren2015classtranscribe:,
 author={Jia-Chen Ren and Lawrence Angrave and Mark Hasegawa-Johnson},
 title={{ClassTranscribe}: A New Tool with New Educational Opportunities for Student Crowdsourced College Lecture Transcriptions},
 url={https://www.isca-speech.org/archive/slate_2015/ren15_slate.html},
 booktitle={SLaTE (the Workshop on Speech and Language Technology in Education)},
 year={2015},
 keywords={recognition}
}

@inproceedings{chen2015classtranscribe,
 author={Jia Chen Ren and Mark Hasegawa-Johnson and Lawrence Angrave},
 title={{ClassTranscribe}},
 booktitle={ICER Conference},
 year={2015},
 keywords={recognition}
}

@inproceedings{hasegawajohnson2011multimodal,
 author={Mark Hasegawa-Johnson and Camille Goudeseune and Jennifer Cole and Hank Kaczmarski and Heejin Kim and Sarah King and Timothy Mahrt and Jui-Ting Huang and Xiaodan Zhuang and Kai-Hsiang Lin and Harsh Vardhan Sharma and Zhen Li and Thomas S. Huang},
 title={Multimodal Speech and Audio User Interfaces for {K-12} Outreach},
 url={http://www.apsipa.org/proceedings_2011/pdf/APSIPA256.pdf},
 booktitle={APSIPA},
 year={2011},
 pages={256:1--8},
 grant={NSF 0807329},
 keywords={recognition}
}

@inproceedings{harvill2021synthesis,
 author={John Harvill and Dias Issa and Mark Hasegawa-Johnson and Changdong Yoo},
 title={Synthesis of New Words for Improved Dysarthric Speech Recognition on an Expanded Vocabulary},
 doi={10.1109/ICASSP39728.2021.9414869},
 booktitle=icassp,
 year={2021},
 pages={6428--6432},
 keywords={recognition}
}

@inproceedings{morovelazquez2019study,
 author={Laureano Moro-Velazquez and JaeJin Cho and Shinji Watanabe and Mark A. Hasegawa-Johnson and Odette Scharenborg and Heejin Kim and Najim Dehak},
 keywords={recognition},
 title={Study of the Performance of Automatic Speech Recognition Systems in Speakers with {Parkinson's} Disease},
 year=2019,
 booktitle=interspeech,
 pages={3875--3879},
 doi={10.21437/Interspeech.2019-2993}
}

@article{sharma2012csl,
 author={Harsh Vardhan Sharma and Mark Hasegawa-Johnson},
 title={Acoustic Model Adaptation using in-domain Background Models for Dysarthric Speech Recognition},
 doi={10.1016/j.csl.2012.10.002},
 journal={Computer Speech and Language},
 volume={27},
 number={6},
 month={September},
 year={2013},
 pages={1147--1162},
 keywords={recognition}
}

@phdthesis{sharma2012thesis,
  author   = {Harsh Vardhan Sharma},
  title    = {Acoustic Model Adaptation for Recognition of Dysarthric Speech},
  school   = {University of Illinois},
  year     = {2012},
  url      = {https://www.ideals.illinois.edu/items/32231},
  keywords = {recognition}
}

@inproceedings{sharma2010state,
 author={Harsh Vardhan Sharma and Mark Hasegawa-Johnson},
 title={State Transition Interpolation and {MAP} Adaptation for {HMM}-based Dysarthric Speech Recognition},
 url={https://dl.acm.org/citation.cfm?id=1867763},
 booktitle={HLT/NAACL Workshop on Speech and Language Processing for Assistive Technology (SLPAT)},
 pages={72--79},
 year={2010},
 grant={NSF 0534106},
 keywords={recognition}
}

@inproceedings{sharma2009universal,
  author    = {Harsh Vardhan Sharma and Mark Hasegawa-Johnson and Jon Gunderson and Adrienne Perlman},
  title     = {Universal Access: Speech Recognition for Talkers with Spastic Dysarthria},
  booktitle = interspeech,
  address   = {Brighton},
  pages     = {1451--1454},
  month     = {September},
  year      = {2009},
  doi       = {10.21437/Interspeech.2009-444},
  grant     = {NIH R21 DC008090A},
  keywords  = {recognition}
}

@inproceedings{kim2008dysarthric,
 author={Heejin Kim and Mark Hasegawa-Johnson and Adrienne Perlman and Jon Gunderson and Thomas Huang and Kenneth Watkin and Simone Frame},
 title={Dysarthric Speech Database for Universal Access Research},
  doi={10.21437/Interspeech.2008-480},
  booktitle=interspeech,
 year={2008},
 pages={1741--1744},
 grant={NIH DC008090A},
 keywords={recognition}
}

@inproceedings{zhu2007cellphone-based,
  author    = {Weimo Zhu and Mark Hasegawa-Johnson and Karen Chapman-Novakofski and Arthur Kantor},
  title     = {Cellphone-Based Nutrition E-Diary},
  year      = {2007},
  booktitle = {National Nutrient Database Conference},
  keywords  = {recognition}
}

@inproceedings{zhu2007ecoder,
  author    = {Weimo Zhu and Mark Hasegawa-Johnson and Arthur Kantor and Dan Roth and Yong Gao and Youngsik Park and Lin Yang},
  title     = {E-coder for Automatic Scoring Physical Activity Diary Data: Development and Validation},
  year      = {2007},
  booktitle = {ACSM},
  keywords  = {recognition}
}

@inproceedings{hasegawajohnson2006hmm-based,
 author={Mark Hasegawa-Johnson and Jonathan Gunderson and Adrienne Perlman and Thomas Huang},
 title={{HMM}-Based and {SVM}-Based Recognition of the Speech of Talkers with Spastic Dysarthria},
 doi={10.1109/ICASSP.2006.1660840},
 booktitle=icassp,
 pages={III:1060--1063},
 month={May},
 year={2006},
 grant={NSF 0534106},
 keywords={recognition}
}

@inproceedings{kantor2005restricted,
 author={Arthur Kantor and Weimo Zhu and Mark Hasegawa-Johnson},
 title={Restricted domain speech classification using automatic transcription and {SVMs}},
 booktitle={Midwest Computational Linguistics Colloquium},
 year={2005},
 keywords={recognition}
}

@inproceedings{zhu2005accuracy,
  author    = {Weimo Zhu and Mark Hasegawa-Johnson and Mital Arun Gandhi},
  title     = {Accuracy of Voice-Recognition Technology in Collecting Behavior Diary Data},
  year      = {2005},
  month     = {March},
  booktitle = {Association of Test Publishers (ATP): Innovations in Testing},
  keywords  = {recognition}
}

@inproceedings{kang2023end,
  author    = {Wonjune Kang and Mark Hasegawa-Johnson and Deb Roy},
  title     = {End-to-End Zero-Shot Voice Conversion with Location-Variable Convolutions},
  year      = {2023},
  booktitle = interspeech,
  keywords  = {synthesis}
}

@inproceedings{ni22_interspeech,
  author={Junrui Ni and Liming Wang and Heting Gao and Kaizhi Qian and Yang Zhang and Shiyu Chang and Mark Hasegawa-Johnson},
  title={Unsupervised Text-to-Speech Synthesis by Unsupervised Automatic Speech Recognition},
  year=2022,
  booktitle=interspeech,
  pages={461--465},
  doi={10.21437/Interspeech.2022-816}
}

@inproceedings{qian2021global,
 author={Kaizhi Qian and Yang Zhang and Shiyu Chang and Chuang Gan and David D. Cox and Mark Hasegawa-Johnson and Jinjun Xiong},
 title={Global Rhythm Style Transfer Without Text Transcriptions},
 url={http://proceedings.mlr.press/v139/qian21b/qian21b.pdf},
 booktitle=icml,
 year={2021},
 keywords={synthesis}
}

@inproceedings{wang2021show,
 author={Xinsheng Wang and Siyuan Feng and Jihua Zhu and Mark Hasegawa-Johnson and Odette Scharenborg},
 title={Show and Speak: Directly Synthesize Spoken Description of Images},
 doi={10.1109/ICASSP39728.2021.9414021},
 booktitle=icassp,
 year={2021},
 keywords={synthesis}
}

@inproceedings{qian2020unsupervised,
  author    = {Kaizhi Qian and Yang Zhang and Shiyu Chang and Mark Hasegawa-Johnson and David Cox},
  title     = {Unsupervised Speech Decomposition via Triple Information Bottleneck},
  booktitle = icml,
  volume    = {119},
  pages     = {7836--7846},
  year      = {2020},
  url       = {http://proceedings.mlr.press/v119/qian20a.html},
  demo      = {https://auspicious3000.github.io/SpeechSplit-Demo/},
  keywords  = {synthesis}
}

@inproceedings{qian2020f0-consistent,
 author={Kaizhi Qian and Zeyu Jin and Mark Hasegawa-Johnson and Gautham Mysore},
 title={F0-Consistent Many-to-Many Non-Parallel Voice Conversion via Conditional Autoencoder},
 doi={10.1109/ICASSP40776.2020.9054734},
 booktitle=icassp,
 year={2020},
 pages={6284--6288},
 keywords={synthesis}
}

@article{qian2019autovc:,
 author={Kaizhi Qian and Yang Zhang and Shiyu Chang and Xuesong Yang and Mark Hasegawa-Johnson},
 title={{AutoVC}: Zero-Shot Voice Style Transfer with Only Autoencoder Loss},
 url={http://proceedings.mlr.press/v97/qian19c/qian19c.pdf},
 demo={https://auspicious3000.github.io/autovc-demo/},
 journal={Proceedings of Machine Learning Research},
 volume={97},
 pages={5210--5219},
 year={2019},
 keywords={synthesis}
}

@article{hasegawajohnson2018image2speech:,
 author={Mark Hasegawa-Johnson and Alan Black and Lucas Ondel and Odette Scharenborg and Francesco Ciannella},
 title={Image2speech: Automatically generating audio descriptions of images},
 url={https://www.researchgate.net/profile/Kamel-Smaili-2/publication/354700462_INTERNATIONAL_CONFERENCE_ON_NATURAL_LANGUAGE_SIGNAL_AND_SPEECH_PROCESSING_Casablanca_2017_Morocco_Sponsor_ICNLSSP_International_Conference_on_Natural_Language_Signal_and_Speech_Processing/links/6148a03ea595d06017dd226b/INTERNATIONAL-CONFERENCE-ON-NATURAL-LANGUAGE-SIGNAL-AND-SPEECH-PROCESSING-Casablanca-2017-Morocco-Sponsor-ICNLSSP-International-Conference-on-Natural-Language-Signal-and-Speech-Processing.pdf#page=66},
 journal={Journal of the International Science and General Applications (ISGA)},
 volume={1},
 number={1},
 year={2018},
 keywords={synthesis}
}

@inproceedings{zhang2015incorporating,
 author={Yang Zhang and Zhijian Ou and Mark Hasegawa-Johnson},
 title={Incorporating {AM-FM} effect in voiced speech for probabilistic acoustic tube model},
 doi={10.1109/WASPAA.2015.7336905},
 booktitle={Proc. WASPAA},
 year={2015},
 keywords={synthesis}
}

@inproceedings{zhang2014improvement,
 author={Yang Zhang and Zhijian Ou and Mark Hasegawa-Johnson},
 title={Improvement of Probabilistic Acoustic Tube Model for Speech Decomposition},
 doi={10.1109/ICASSP.2014.6855144},
 booktitle=icassp,
 year={2014},
 keywords={synthesis}
}

@inproceedings{zhuang2010a,
 author={Xiaodan Zhuang and Lijuan Wang and Frank Soong and Mark Hasegawa-Johnson},
 title={A Minimum Converted Trajectory Error ({MCTE}) Approach to High Quality Speech-to-Lips Conversion},
 booktitle=interspeech,
 year={2010},
 pages={1736--1739},
 doi={10.21437/Interspeech.2010-498},
 grant={NSF 0703624},
 keywords={synthesis}
}

@article{huang2009sensitive,
 author={Thomas S. Huang and Mark A. Hasegawa-Johnson and Stephen M. Chu and Zhihong Zeng and Hao Tang},
 title={Sensitive Talking Heads},
 doi={10.1109/MSP.2009.932562},
 journal={IEEE Signal Processing Magazine},
 volume={26},
 number={4},
 pages={67--72},
 month={July},
 year={2009},
 keywords={synthesis}
}

@article{tang2008humanoid,
 author={Hao Tang and Yun Fu and Jilin Tu and Mark Hasegawa-Johnson and Thomas S. Huang},
 title={Humanoid Audio-Visual Avatar with Emotive Text-to-Speech Synthesis},
 doi={10.1109/TMM.2008.2001355},
 journal={IEEE Transactions on Multimedia},
 volume={10},
 number={6},
 pages={969--981},
 year={2008},
 keywords={synthesis}
}

@inproceedings{tang2008real-time,
 author={Hao Tang and Yuxiao Hu and Yun Fu and Mark Hasegawa-Johnson and Thomas S. Huang},
 title={Real-time conversion from a single {2D} face image to a {3D} text-driven emotive audio-visual avatar},
 doi={10.1109/ICME.2008.4607657},
 booktitle={IEEE International Conference on Multimedia and Expo (ICME)},
 year={2008},
 pages={1205--1208},
 keywords={synthesis}
}

@inproceedings{tang2008two-stage,
 author={Hao Tang and Xi Zhou and Matthias Odisio and Mark Hasegawa-Johnson and Thomas Huang},
 title={Two-Stage Prosody Prediction for Emotional Text-to-Speech Synthesis},
 booktitle=interspeech,
 year={2008},
 pages={2138--2141},
  doi={10.21437/Interspeech.2008-554},
  grant={NSF 0426627},
 keywords={synthesis}
}

@inproceedings{tang2008eava:,
 author={Hao Tang and Yun Fu and Jilin Tu and Thomas Huang and Mark Hasegawa-Johnson},
 title={{EAVA}: A {3D} Emotive Audio-Visual Avatar},
 doi={10.1109/WACV.2008.4544003},
 booktitle={IEEE Workshop on Applications of Computer Vision (IEEE WACV)},
 pages={1--6},
 year={2008},
 grant={NSF 0426627},
 keywords={synthesis}
}

@inproceedings{zhu2021multi-decoder,
 author={Junzhe Zhu and Raymond Yeh and Mark Hasegawa-Johnson},
 title={Multi-Decoder {DPRNN}: Source Separation for Variable Number of Speakers},
 doi={10.1109/ICASSP39728.2021.9414205},
 booktitle=icassp,
 year={2021},
 pages={3420--3424},
 keywords={synthesis}
}

@inproceedings{yian2018time-frequency,
 author={Teck Yian Lim and Raymond Yeh and Yijia Xu and Minh Do and Mark Hasegawa-Johnson},
 title={Time-Frequency Networks for Audio Super-Resolution},
 doi={10.1109/ICASSP.2018.8462049},
 booktitle=icassp,
 year={2018},
 keywords={synthesis}
}

@inproceedings{qian2018deep,
 author={Kaizhi Qian and Yang Zhang and Shiyu Chang and Xuesong Yang and Dinei Florêncio and Mark Hasegawa-Johnson},
 title={Deep Learning Based Speech Beamforming},
 doi={10.1109/ICASSP.2018.8462430},
 booktitle=icassp,
 year={2018},
 pages={5389--5393},
 keywords={synthesis}
}

@inproceedings{zhang17j_interspeech,
  author={Yang Zhang and Dinei Florêncio and Mark Hasegawa-Johnson},
  title={Glottal Model Based Speech Beamforming for ad-hoc Microphone Arrays},
  year=2017,
  booktitle=interspeech,
  pages={2675--2679},
  doi={10.21437/Interspeech.2017-1659}
}

@inproceedings{qian2017speech,
 author={Kaizhi Qian and Yang Zhang and Shiyu Chang and Xuesong Yang and Dinei Florêncio and Mark Hasegawa-Johnson},
 title={Speech Enhancement Using {Bayesian} {Wavenet}},
 booktitle=interspeech,
 year={2017},
 keywords={synthesis},
  pages={2013--2017},
  doi={10.21437/Interspeech.2017-1672}
}

@inproceedings{chan2022speech,
  author    = {Chak Ho Chan and Kaizhi Qian and Yang Zhang and Mark Hasegawa-Johnson},
  title     = {{SpeechSplit2.0}: Unsupervised Speech Disentanglement for Voice Conversion without Tuning Autoencoder Bottlenecks},
  booktitle = icassp,
  pages     = {6332--6336},
  year      = {2022},
  doi       = {10.1109/ICASSP43922.2022.9747763},
  url       = {https://doi.org/10.1109/ICASSP43922.2022.9747763}
}

@inproceedings{wang2016use,
  author    = {Ruobai Wang and Yang Zhang and Zhijian Ou and Mark Hasegawa-Johnson},
  title     = {Use of Particle Filtering and {MCMC} for Inference in Probabilistic Acoustic Tube Model},
  booktitle = {IEEE Workshop on Statistical Signal Processing},
  year      = {2016},
  doi       = {10.1109/SSP.2016.7551748},
  keywords  = {synthesis}
}

@article{huang2015joint,
  author   = {Po-Sen Huang and Minje Kim and Mark Hasegawa-Johnson and Paris Smaragdis},
  title    = {Joint Optimization of Masks and Deep Recurrent Neural Networks for Monaural Source Separation},
  journal  = {IEEE Trans. Audio, Speech and Language Processing},
  volume   = {23},
  number   = {12},
  pages    = {2136--2147},
  year     = {2015},
  doi      = {10.1109/TASLP.2015.2468583},
  url      = {https://arxiv.org/abs/1502.04149},
  keywords = {synthesis}
}

@inproceedings{huang2014deep,
  author    = {Po-Sen Huang and Minje Kim and Paris Smaragdis and Mark Hasegawa-Johnson},
  title     = {Deep Learning for Monaural Speech Separation},
  booktitle = icassp,
  year      = {2014},
  doi       = {10.1109/ICASSP.2014.6853860},
  grant     = {ARO W911NF-09-1-0383},
  keywords  = {synthesis}
}

@inproceedings{huang2012singing-voice,
  author    = {Po-Sen Huang and Scott Deeann Chen and Paris Smaragdis and Mark Hasegawa-Johnson},
  title     = {Singing-Voice Separation from Monaural Recordings using Robust Principal Component Analysis},
  booktitle = icassp,
  year      = {2012},
  doi       = {10.1109/ICASSP.2012.6287816},
  grant     = {ARO W911NF-09-1-0383},
  keywords  = {synthesis}
}

@phdthesis{kim2010statistical,
  author   = {Lae-Hoon Kim},
  title    = {Statistical Model Based Multi-Microphone Speech Processing: Toward Overcoming Mismatch Problem},
  school   = {University of Illinois},
  month    = {August},
  year     = {2010},
  url      = {http://hdl.handle.net/2142/16839},
  keywords = {synthesis}
}

@inproceedings{kim2010toward,
  author    = {Lae-Hoon Kim and Mark Hasegawa-Johnson},
  title     = {Toward Overcoming Fundamental Limitation in Frequency-Domain Blind Source Separation for Reverberant Speech Mixtures},
  booktitle = {Proceedings of Asilomar},
  year      = {2010},
  doi       = {10.1109/ACSSC.2010.5757618},
  grant     = {NSF 0913188},
  keywords  = {synthesis}
}

@inproceedings{kim2010robust,
  author    = {Lae-Hoon Kim and Kyung-Tae Kim and Mark Hasegawa-Johnson},
  title     = {Robust Automatic Speech Recognition with Decoder Oriented Ideal Binary Mask Estimation},
  booktitle = interspeech,
  pages     = {2066--2069},
  year      = {2010},
  doi       = {10.21437/Interspeech.2010-583},
  grant     = {NSF 0913188},
  keywords  = {synthesis}
}

@article{kim2010speech,
  author   = {Lae-Hoon Kim and Kyungtae Kim and Mark Hasegawa-Johnson},
  title    = {Speech enhancement beyond minimum mean squared error with perceptual noise shaping},
  journal  = jasa,
  volume   = {127},
  number   = {3},
  pages    = {1817},
  year     = {2010},
  doi      = {10.1121/1.3384190},
  keywords = {synthesis}
}

@inproceedings{kim2010joint,
  author    = {Lae-Hoon Kim and Mark Hasegawa-Johnson and Gerasimos Potamianos and Vit Libal},
  title     = {Joint Estimation of {DOA} and Speech Based on {EM} Beamforming},
  booktitle = icassp,
  year      = {2010},
  doi       = {10.1109/ICASSP.2010.5496144},
  keywords  = {synthesis}
}

@inproceedings{kim2009optimal,
  author    = {Lae-Hoon Kim and Mark Hasegawa-Johnson},
  title     = {Optimal Multi-Microphone Speech Enhancement in Cars},
  booktitle = {DSP in Cars workshop},
  address   = {Dallas},
  month     = {July},
  year      = {2009},
  url       = {https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=f43edc454be762b15b7b023f52f406c00f695b59},
  grant     = {NSF 0803219},
  keywords  = {synthesis}
}

@article{kim2008acoustic,
  author   = {Lae-Hoon Kim and Mark Hasegawa-Johnson and Jun-Seok Lim and Koeng-Mo Sung},
  title    = {Acoustic model for robustness analysis of optimal multipoint room equalization},
  journal  = jasa,
  volume   = {123},
  number   = {4},
  pages    = {2043--2053},
  year     = {2008},
  doi      = {10.1121/1.2837285},
  keywords = {synthesis}
}

@inproceedings{kim2008optimal,
  author    = {Lae-Hoon Kim and Mark Hasegawa-Johnson},
  title     = {Optimal Speech Estimator Considering Room Response as well as Additive Noise: Different Approaches in Low and High Frequency Range},
  booktitle = icassp,
  pages     = {4573--4576},
  year      = {2008},
  doi       = {10.1109/ICASSP.2008.4518674},
  keywords  = {synthesis}
}

@inproceedings{lee000035minimum,
  author    = {Bowon Lee and Mark Hasegawa-Johnson},
  title     = {Minimum Mean Squared Error A Posteriori Estimation of High Variance Vehicular Noise},
  booktitle = {2007 Biennial on DSP for In-Vehicle and Mobile Systems},
  address   = {Istanbul},
  month     = {June},
  year      = {2007},
  url       = {https://citeseerx.ist.psu.edu/document?repid=rep1&type=pdf&doi=1d23cdbd3b402db72ed6ea907bdf7f54d3c9dc2e},
  grant     = {Motorola RPS19},
  keywords  = {synthesis}
}

@unpublished{hasegawajohnson2006dealing1,
  author   = {Mark Hasegawa-Johnson},
  title    = {Dealing with Acoustic Noise. Part {II}: Beamforming},
  note     = {Tutorial presentation given at WS06, Center for Language and Speech Processing},
  month    = {July},
  year     = {2006},
  keywords = {synthesis}
}

@unpublished{hasegawajohnson2006dealing2,
  author   = {Mark Hasegawa-Johnson},
  title    = {Dealing with Acoustic Noise. Part {I}: Spectral Estimation},
  note     = {Tutorial presentation given at WS06, Center for Language and Speech Processing},
  month    = {July},
  year     = {2006},
  keywords = {synthesis}
}

@unpublished{dupoux2017speaking,
  author = {Emmanuel Dupoux and Odette Scharenborg and Graham Neubig and Laurent Besacier and Mark Hasegawa-Johnson and Alan Black and Florian Metze and Sebastian St{\"{u}}ker},
  title  = {The Speaking Rosetta Stone - Discovering Grounded Linguistic Units for Languages without Orthography},
  note   = {Final report of the WS17 Frederick Jelinek Memorial Summer Workshop team},
  year   = {2017},
  url    = {https://www.lti.cs.cmu.edu/2017-jelinek-workshop}
}

@inproceedings{kim2006generalized,
  author    = {Lae-Hoon Kim and Mark Hasegawa-Johnson and Keung-Mo Sung},
  title     = {Generalized Optimal Multi-Microphone Speech Enhancement Using Sequential Minimum Variance Distortionless Response ({MVDR}) Beamforming and Postfiltering},
  booktitle = icassp,
  pages     = {III:65--68},
  month     = {May},
  year      = {2006},
  doi       = {10.1109/ICASSP.2006.1660591},
  keywords  = {synthesis}
}

@inproceedings{kim2005generalized,
  author    = {Lae-Hoon Kim and Mark Hasegawa-Johnson},
  title     = {Generalized multi-microphone spectral amplitude estimation based on correlated noise model},
  booktitle = {119th Convention of the Audio Engineering Society},
  address   = {New York},
  month     = {October},
  year      = {2005},
  keywords  = {synthesis}
}

@inproceedings{gandhi2004source,
  author    = {Mital Gandhi and Mark Hasegawa-Johnson},
  title     = {Source Separation using Particle Filters},
  booktitle = interspeech,
  pages     = {2673--2676},
  month     = {October},
  year      = {2004},
  doi       = {10.21437/Interspeech.2004-710},
  keywords  = {synthesis}
}

@article{lee2003open,
  author   = {Bowon Lee and Mark Hasegawa-Johnson and Camille Goudeseune},
  title    = {Open Loop Multichannel Inversion of Room Impulse Response},
  journal  = jasa,
  volume   = {113},
  number   = {4},
  pages    = {2202--2203},
  year     = {2003},
  doi      = {10.1121/1.4780198},
  keywords = {synthesis}
}

@incollection{hasegawajohnson2002speech,
  author    = {Mark Hasegawa-Johnson and Abeer Alwan},
  title     = {Speech Coding: Fundamentals and Applications},
  booktitle = {Wiley Encyclopedia of Telecommunications and Signal Processing},
  editor    = {J. Proakis},
  publisher = {Wiley and Sons},
  address   = {NY},
  month     = {December},
  year      = {2002},
  grant     = {NSF 0132900},
  keywords  = {synthesis}
}

@misc{taniguchi1998speech,
  author       = {Tomohiko Taniguchi and Mark Johnson},
  title        = {Speech coding and decoding system},
  howpublished = {United States Patent Number 5799131},
  month        = {August},
  year         = {1998},
  url          = {https://patentimages.storage.googleapis.com/5e/54/26/3ff3894828a9d3/US5799131.pdf},
  abstract     = {Transform stochastic codebook so that, after perceptual weighting, it will be orthogonal to the adaptive codebook},
  keywords     = {synthesis}
}

@misc{taniguchi1994speech,
  author       = {Tomohiko Taniguchi and Mark Johnson and Yasuji Ohta and Hideki Kurihara and Yoshinori Tanaka and Yoshihito Sakai},
  title        = {Speech coding system having codebook storing differential vectors between each two adjoining code vectors},
  howpublished = {United States Patent Number 5323486},
  month        = {June},
  year         = {1994},
  url          = {https://patentimages.storage.googleapis.com/6e/ac/fb/78352f241fd201/US5323486.pdf},
  keywords     = {synthesis}
}

@misc{taniguchi1993speech1,
  author       = {Tomohiko Taniguchi and Mark Johnson},
  title        = {Speech coding system},
  howpublished = {United States Patent Number 5245662},
  month        = {September},
  year         = {1993},
  url          = {https://patentimages.storage.googleapis.com/67/19/4e/63aa5e1e86ae4e/US5245662.pdf},
  abstract     = {hexagonal lattice},
  keywords     = {synthesis}
}

@misc{taniguchi1993speech2,
  author       = {Tomohiko Taniguchi and Mark Johnson and Hideki Kurihara and Yoshinori Tanaka and Yasuji Ohta},
  title        = {Speech coding and decoding system},
  howpublished = {United States Patent Number 5199076},
  month        = {March},
  year         = {1993},
  url          = {https://patentimages.storage.googleapis.com/f5/8e/8f/fb388df1a25c93/US5199076.pdf},
  abstract     = {sparse adaptive codebook},
  keywords     = {synthesis}
}

@article{johnson1992on-line,
  author   = {Mark Johnson and Tomohiko Taniguchi},
  title    = {On-line and off-line computational reduction techniques using backward filtering in {CELP} speech coders},
  journal  = {IEEE Transactions on Signal Processing},
  volume   = {40},
  pages    = {2090--2093},
  year     = {1992},
  doi      = {10.1109/78.149977},
  keywords = {synthesis}
}

@inproceedings{johnson1991low-complexity,
  author    = {Mark A. Johnson and Tomohiko Taniguchi},
  title     = {Low-complexity multi-mode {VXC} using multi-stage optimization and mode selection},
  booktitle = icassp,
  address   = {Toronto, Canada},
  pages     = {221--224},
  year      = {1991},
  doi       = {10.1109/ICASSP.1991.150317},
  keywords  = {synthesis}
}

@inproceedings{taniguchi1991pitch,
  author    = {Tomohiko Taniguchi and Mark A. Johnson and Yasuji Ohta},
  title     = {Pitch sharpening for perceptually improved {CELP}, and the sparse-delta codebook for reduced computation},
  booktitle = icassp,
  address   = {Toronto, Canada},
  pages     = {241--244},
  year      = {1991},
  doi       = {10.1109/ICASSP.1991.150322},
  keywords  = {synthesis}
}

@inproceedings{taniguchi1991improving,
  author    = {Tomohiko Taniguchi and Fumio Amano and Mark A. Johnson},
  title     = {Improving the performance of {CELP}-based speech coding at low bit rates},
  booktitle = {International Symposium on Circuits and Systems},
  address   = {Singapore},
  year      = {1991},
  doi       = {10.1109/ISCAS.1991.176404},
  keywords  = {synthesis}
}

@inproceedings{johnson1990computational,
  author    = {Mark A. Johnson and Tomohiko Taniguchi},
  title     = {Computational reduction in sparse-codebook {CELP} using backward-weighting of the input},
  booktitle = {Institute of Electr. and Information and Comm. Eng. Symposium DSP 90-15},
  address   = {Hakata},
  pages     = {61--66},
  year      = {1990},
  keywords  = {synthesis}
}

@inproceedings{taniguchi1990multi-vector,
  author    = {Tomohiko Taniguchi and Mark A. Johnson and Yasuji Ohta},
  title     = {Multi-vector pitch-orthogonal {LPC}: quality speech with low complexity at rates between 4 and 8 kbps},
  booktitle = {ICSLP},
  address   = {Kobe},
  pages     = {113--116},
  year      = {1990},
  doi       = {10.21437/ICSLP.1990-29},
  keywords  = {synthesis}
}

@inproceedings{johnson1990pitch-orthogonal,
  author    = {Mark A. Johnson and Tomohiko Taniguchi},
  title     = {Pitch-orthogonal code-excited {LPC}},
  booktitle = {IEEE Global Telecommunications Conference (GLOBECOM)},
  address   = {San Diego, CA},
  pages     = {542--546},
  year      = {1990},
  doi       = {10.1109/GLOCOM.1990.116570},
  keywords  = {synthesis}
}

@inproceedings{huang00signal,
  author    = {Jun Huang and Stephen Levinson and Mark Hasegawa-Johnson},
  title     = {Signal approximation in {Hilbert} space and its application on articulatory speech synthesis},
  booktitle = {Proc. 6th International Conference on Spoken Language Processing (ICSLP 2000)},
  volume    = {2},
  pages     = {775--778},
  year      = {2000},
  doi       = {10.21437/ICSLP.2000-384},
  keywords  = {synthesis}
}
@inproceedings{sakakini2020automatic,
  author    = {Tarek Sakakini and Jong Yoon Lee and Aditya Srinivasa and Renato Azevedo and Victor Sadauskas and Kuangxiao Gu and Suma Bhat and Dan Morrow and James Graumlich and Saqib Walayat and Mark Hasegawa-Johnson and Donald Wilpern and Ann Willemsen-Dunlap},
  title     = {Automatic Text Simplification of Health Materials in Low-Resource Domains},
  booktitle = {LOUHI: 11th International Workshop on Health Text Mining and Information Analysis},
  year      = {2020},
  url       = {https://louhi2020.fbk.eu/},
  keywords  = {synthesis}
}

@inproceedings{morrow2020closing,
  author    = {Daniel Morrow and Renato F. L. Azevedo and Leda Sari and Kuangxiao Gu and Tarek Sakakini and Mark Hasegawa-Johnson and Suma Bhat and James Graumlich and Thomas Huang and Andrew Hariharan and Yunxin Shao and Elizabeth Cox},
  title     = {Closing the Loop in Computer Agent/Patient Communication},
  booktitle = {Proceedings of the 2020 Human Factors and Ergonomics Society Annual Meeting},
  address   = {Chicago, IL},
  year      = {2020},
  keywords  = {synthesis}
}

@article{morrow2019contextualizing,
  author   = {Daniel Morrow and Renato F. L. Azevedo and Rocio Garcia-Retamero and Mark Hasegawa-Johnson and Thomas Huang and William Schuh and Kuangxiao Gu and Yang Zhang},
  title    = {Contextualizing numeric clinical test results for gist comprehension: Implications for {EHR} patient portals},
  journal  = {Journal of Experimental Psychology: Applied},
  volume   = {25},
  number   = {1},
  pages    = {41--61},
  year     = {2019},
  doi      = {10.1037/xap0000203},
  keywords = {synthesis}
}

@inproceedings{azevedo2019the,
  author    = {Renato F. L. Azevedo and Dan Morrow and Kuangxiao Gu and Thomas Huang and Mark Hasegawa-Johnson and P. Soni and S. Tang and Tarek Sakakini and Suma Bhat and Ann Willemsen-Dunlap and James Graumlich},
  title     = {The Influence of Computer Agent Characteristics on User Preferences in Health Contexts},
  booktitle = {Proceedings of the 2019 Human Factors and Ergonomics Society Health Care Symposium},
  year      = {2019},
  keywords  = {synthesis}
}

@inproceedings{azevedo2018using,
  author    = {Renato F. L. Azevedo and Dan Morrow and James Graumlich and Ann Willemsen-Dunlap and Mark Hasegawa-Johnson and Thomas S. Huang and Kuangxiao Gu and Suma Bhat and Tarek Sakakini and Victor Sadauskas and Donald J. Halpin},
  title     = {Using conversational agents to explain medication instructions to older adults},
  booktitle = {AMIA Annu Symp Proc.},
  pages     = {185--194},
  year      = {2018},
  url       = {https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6371340/},
  pmid      = {30815056},
  keywords  = {synthesis}
}

@inproceedings{azevedo2018computer,
  author    = {Renato Azevedo and Daniel G. Morrow and Kuangxiao Gu and  Thomas Huang and Mark Allan Hasegawa-Johnson and James Graumlich and Victor Sadauskas and Tarek J. Sakakini and Suma Pallathadka Bhat and Ann M. Willemsen-Dunlap and Donald J. Halpin},
  title     = {Computer Agents and Patient Memory for Medication Information},
  booktitle = {APA Annual Meeting},
  year      = {2018},
  keywords  = {synthesis}
}

@article{morrow2018a,
  author   = {Daniel Morrow and Mark Hasegawa-Johnson and Thomas Huang and William Schuh and Renato Azevedo and Kuangxiao Gu and Yang Zhang and Bidisha Roy and Rocio Garcia-Retamero},
  title    = {A Multidisciplinary Approach to Designing and Evaluating Electronic Medical Record Portal Messages that Support Patient Self-Care},
  journal  = {Journal of Biomedical Informatics},
  volume   = {69},
  pages    = {63--74},
  month    = {5},
  year     = {2017},
  doi      = {10.1016/j.jbi.2017.03.015},
  keywords = {synthesis}
}

@inproceedings{morrow2016multimedia,
  author    = {Daniel Morrow and Mark Hasegawa-Johnson and Thomas Huang and William Schuh and Rocio Garcia-Retamero and Renato Azevedo and Kuangxiao Gu and Yang Zhang and Bidisha Roy},
  title     = {Multimedia formats can improve older adult comprehension of clinical test results: Implications for Designing Patient Portals},
  booktitle = {28th APS Annual Convention (Association for Psychological Science)},
  month     = {May},
  year      = {2016},
  grant     = {AHRQ R21HS022948},
  keywords  = {synthesis}
}

@inproceedings{azevedo2015improving,
  author    = {Renato F. L. Azevedo and Daniel Morrow and Mark Hasegawa-Johnson and Kuangxiao Gu and Dan Soberal and Thomas Huang and William Schuh  and Rocio Garcia-Retamero},
  title     = {Improving Patient Comprehension of Numeric Health Information},
  booktitle = {Human Factors Conference},
  year      = {2015},
  grant     = {AHRQ R21HS022948},
  keywords  = {synthesis}
}

@article{azevedo2024influence,
  author    = {Renato Azevedo and Rocio Garcia-Retamero and Mark Hasegawa-Johnson and Kuangxiao Gu and Daniel G. Morrow},
  title     = {The Influence of Memory for and Affective Response to Health Messages on Self-care Behavioral Intentions},
  journal   = {Human Factors in Healthcare},
  volume    = {4},
  pages     = {100058},
  month     = {12},
  year      = {2023},
  publisher = {Elsevier}
}

@inproceedings{huang2014singing-voice,
  author    = {Po-Sen Huang and Minje Kim and Mark Hasegawa-Johnson and Paris Smaragdis},
  title     = {Singing-Voice Separation From Monaural Recordings Using Deep Recurrent Neural Networks},
  booktitle = {Proceedings of ISMIR},
  year      = {2014},
  url       = {https://archives.ismir.net/ismir2014/paper/000154.pdf},
  keywords  = {synthesis}
}

@article{paine2016fast,
  author        = {Paine, Tom Le and Khorrami, Pooya and Chang, Shiyu and Zhang, Yang and Ramachandran, Prajit and Hasegawa-Johnson, Mark A and Huang, Thomas S},
  title         = {Fast {Wavenet} generation algorithm},
  journal       = {arXiv preprint arXiv:1611.09482},
  year          = {2016},
  eprint        = {1611.09482},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/1611.09482},
  keywords      = {synthesis}
}

@inproceedings{chang2023classification,
  author    = {Kai Chieh Chang and Mark Hasegawa-Johnson and Nancy L. McElwain and Bashima Islam},
  title     = {Classification of Infant Sleep/Wake States: Cross-Attention Among Large Scale Pretrained Transformer Networks Using Audio, {ECG}, and {IMU} Data},
  booktitle = {APSIPA ASC},
  month     = {11},
  year      = {2023},
  url       = {https://arxiv.org/abs/2306.15808},
  keywords  = {multimodal signal understanding}
}

@incollection{kim2020communication,
  author    = {Heejin Kim and Mark Hasegawa-Johnson},
  title     = {Communication Improves When Human or Computer Listeners Adapt to Dysarthria},
  booktitle = {Acoustic Analysis of Pathologies: From Infancy to Young Adulthood},
  editor    = {Amy Neustein and Hemant Patil},
  publisher = {Walter De Gruyter, Inc.},
  address   = {Boston/Berlin},
  pages     = {181--197},
  year      = {2020},
  doi       = {10.1515/9781501513138-005}
}

@phdthesis{bharadwaj2015theory,
  author   = {Sujeeth Bharadwaj},
  title    = {A theory of (almost) zero resource speech recognition},
  school   = {University of Illinois},
  month    = {June},
  year     = {2015},
  url      = {https://www.ideals.illinois.edu/items/79584},
  keywords = {recognition}
}
 
@phdthesis{huang2015shallow,
  author   = {Po-Sen Huang},
  title    = {Shallow and deep learning for audio and natural language processing},
  school   = {University of Illinois},
  month    = {January},
  year     = {2015},
  url      = {https://www.ideals.illinois.edu/items/79707},
  keywords = {audio}
}

@phdthesis{yang2019dealing,
  author   = {Xuesong Yang},
  title    = {Dealing with linguistic mismatches for automatic speech recognition},
  school   = {University of Illinois},
  month    = {May},
  year     = {2019},
  url      = {https://www.ideals.illinois.edu/items/112306},
  keywords = {recognition}
}

@phdthesis{chen2019modeling,
  author   = {Wenda Chen},
  title    = {Modeling phones, keywords, topics and intents in spoken languages},
  school   = {University of Illinois},
  month    = {July},
  year     = {2019},
  url      = {https://www.ideals.illinois.edu/items/112912},
  keywords = {recognition}
}

@phdthesis{qian2020deep,
  author   = {Kaizhi Qian},
  title    = {Deep generative models for speech editing},
  school   = {University of Illinois},
  month    = {November},
  year     = {2020},
  url      = {https://www.ideals.illinois.edu/items/117215},
  keywords = {synthesis}
}

@phdthesis{sari2021learning,
  author   = {Leda Sar{\i}},
  title    = {Learning speech embeddings for speaker adaptation and speech understanding},
  school   = {University of Illinois},
  month    = {April},
  year     = {2021},
  url      = {https://www.ideals.illinois.edu/items/118278},
  keywords = {recognition}
}

@phdthesis{fan2021sparse,
  author   = {Yuchen Fan},
  title    = {Sparse representation in deep vision models},
  school   = {University of Illinois},
  month    = {November},
  year     = {2021},
  url      = {https://www.ideals.illinois.edu/items/123372},
  keywords = {vision}
}

@phdthesis{zhou2021towards,
  author   = {Yuqian Zhou},
  title    = {Towards practical deep learning based image restoration model},
  school   = {University of Illinois},
  month    = {November},
  year     = {2021},
  url      = {https://www.ideals.illinois.edu/items/123259},
  keywords = {vision}
}

@phdthesis{abavisani2022role,
  author   = {Ali Abavisani},
  title    = {The role of talker change, vowel change and speech perceptual measure in hearing impaired phone recognition},
  school   = {University of Illinois},
  month    = {May},
  year     = {2022},
  url      = {https://www.ideals.illinois.edu/items/125380},
  keywords = {recognition}
}

@phdthesis{thomas2023evolution,
  author   = {Oshane Odane Thomas},
  title    = {Evolution of primate cuboid form and the application of learning methods to the analysis of morphological and behavioral phenotypes},
  school   = {University of Illinois},
  month    = {June},
  year     = {2023},
  url      = {https://www.ideals.illinois.edu/items/129109},
  keywords = {biomedical}
}

@phdthesis{wang2023multimodal,
  author   = {Liming Wang},
  title    = {Multimodal spoken unit discovery with paired and unpaired modalities},
  school   = {University of Illinois},
  month    = {May},
  year     = {2023},
  url      = {https://www.ideals.illinois.edu/items/128694},
  keywords = {recognition}
}

@phdthesis{gao2024unsupervised,
  author   = {Heting Gao},
  title    = {Unsupervised speech technology for low-resource languages},
  school   = {University of Illinois},
  month    = {March},
  year     = {2024},
  url      = {https://www.ideals.illinois.edu/items/131276},
  keywords = {recognition}
}

@phdthesis{harvill2024speech,
  author   = {John Harvill},
  title    = {Speech classification and lexical semantic modeling via self-supervision and knowledge transfer},
  school   = {University of Illinois},
  month    = {April},
  year     = {2024},
  url      = {https://www.ideals.illinois.edu/items/131435},
  keywords = {recognition}
}

@phdthesis{li2024breaking,
  author   = {Jialu Li},
  title    = {Breaking down barriers: advancing interdisciplinary speech applications in early children's development},
  school   = {University of Illinois},
  month    = {March},
  year     = {2024},
  url      = {https://www.ideals.illinois.edu/items/131512},
  keywords = {biomedical}
}

@phdthesis{wang2024reasoning,
  author   = {Zhonghao Wang},
  title    = {Reasoning, scaling, generating with vision-language models},
  school   = {University of Illinois},
  month    = {March},
  year     = {2024},
  url      = {https://www.ideals.illinois.edu/items/131362},
  keywords = {vision}
}

@mastersthesis{zhang2024end,
  author = {Feiyu Zhang},
  title  = {End-to-end modeling for code-switching automatic speech recognition},
  school = {University of Illinois},
  year   = {2024},
  url    = {https://www.ideals.illinois.edu/items/131716}
}

@mastersthesis{chang2024fusing,
  author = {Kai Chieh Chang},
  title  = {Fusing multimodal neural networks: a study on sleep classification and sound event localization and detection},
  school = {University of Illinois},
  year   = {2024},
  url    = {https://www.ideals.illinois.edu/items/131693}
}
 
@mastersthesis{lee2023explainable,
  author   = {Seunghyun Lee},
  title    = {Explainable artificial intelligence for inclusive automatic speech recognition},
  school   = {University of Illinois},
  year     = {2023},
  url      = {https://www.ideals.illinois.edu/items/128583},
  keywords = {recognition}
}
 
@mastersthesis{harvill2022dysarthric,
  author   = {John Harvill},
  title    = {Regularization for dysarthric speech recognition and telemedicine applications},
  school   = {University of Illinois},
  year     = {2022},
  url      = {https://www.ideals.illinois.edu/items/124579},
  keywords = {recognition}
}

@mastersthesis{guan2022study,
  author = {Haozhong Guan},
  title  = {Study on speech emotion recognition based on deep learning},
  school = {University of Illinois},
  year   = {2022},
  url    = {https://www.ideals.illinois.edu/items/126694}
}
 
@mastersthesis{morshed2022cross,
  author   = {Mahir Morshed},
  title    = {Cross-lingual articulation information transfer with progressive networks for speech recognition},
  school   = {University of Illinois},
  year     = {2022},
  url      = {https://www.ideals.illinois.edu/items/124791},
  keywords = {recognition}
}

@mastersthesis{chan2022speechsplit2,
  author   = {Chak Ho Chan},
  title    = {{SpeechSplit2}: Disentangling Speech Information Streams without Exhaustive Bottleneck Fine-tuning},
  school   = {University of Illinois},
  year     = {2022},
  url      = {https://www.ideals.illinois.edu/items/118126},
  keywords = {analysis}
}

@unpublished{morshed2019spiral,
  author   = {Mahir Morshed},
  title    = {Spiral representations in end-to-end {Bengali} articulatory feature identification},
  note     = {Unpublished B.S. Thesis},
  school   = {University of Illinois},
  year     = {2019},
  url      = {https://www.ideals.illinois.edu/items/111124},
  keywords = {recognition}
}
 
@mastersthesis{gao2021improving,
  author   = {Heting Gao},
  title    = {Improving multilingual speech recognition systems},
  school   = {University of Illinois},
  year     = {2021},
  url      = {https://www.ideals.illinois.edu/items/123250},
  keywords = {recognition}
}

@mastersthesis{ramnath2021fact,
  author   = {Kiran Ramnath},
  title    = {Fact-based visual question answering using knowledge graph embeddings},
  school   = {University of Illinois},
  year     = {2021},
  url      = {https://www.ideals.illinois.edu/items/118412},
  keywords = {nlp}
}
 
@mastersthesis{ni2021enforcing,
  author = {Ni, Junrui},
  title  = {Enforcing constraints for multi-lingual and cross-lingual speech-to-text systems},
  school = {University of Illinois},
  year   = {2021},
  url    = {https://www.ideals.illinois.edu/items/123289/bitstreams/406101/data.pdf}
}

@mastersthesis{zhu2020multi,
  author   = {Junzhe Zhu},
  title    = {Multi-decoder {DPRNN} high accuracy source counting and separation},
  school   = {University of Illinois},
  year     = {2020},
  url      = {https://www.ideals.illinois.edu/items/116889},
  keywords = {enhancement}
}

@mastersthesis{wu2020semi,
  author   = {Ningkai Wu},
  title    = {Semi-supervised cycle-consistency training for end-to-end {ASR} using unpaired speech},
  school   = {University of Illinois},
  year     = {2020},
  url      = {https://www.ideals.illinois.edu/items/115809},
  keywords = {recognition}
}
 
@mastersthesis{wang2020translation,
  author   = {Liming Wang},
  title    = {A translation framework for discovering word-like units from visual scenes and spoken descriptions},
  school   = {University of Illinois},
  year     = {2020},
  url      = {https://www.ideals.illinois.edu/items/115664},
  keywords = {analysis}
}

@mastersthesis{xu2019acoustic,
  author   = {Yijia Xu},
  title    = {Acoustic Event, Spoken Keyword and Emotional Outburst Detection},
  school   = {University of Illinois},
  year     = {2019},
  url      = {https://www.ideals.illinois.edu/items/112277},
  keywords = {analysis}
}

@unpublished{wang2018multimodal,
  author   = {Liming Wang},
  title    = {Multimodal semantic learning with context-correlated speeches and images},
  note     = {Unpublished B.S. thesis},
  school   = {University of Illinois},
  year     = {2018},
  url      = {https://www.ideals.illinois.edu/items/106072},
  keywords = {analysis}
}

@mastersthesis{qian2018speech,
  author   = {Kaizhi Qian},
  title    = {Speech enhancement using deep dilated {CNN}},
  school   = {University of Illinois},
  year     = {2018},
  url      = {https://www.ideals.illinois.edu/items/107741},
  keywords = {enhancement}
}

@mastersthesis{zhu2017thumbnail,
  author   = {Tianyilin Zhu},
  title    = {Lipreading with convolutional and recurrent neural network models},
  school   = {University of Illinois},
  year     = {2017},
  url      = {https://www.ideals.illinois.edu/items/102816},
  keywords = {multimodal}
}
 
@mastersthesis{yang2015machine,
  author   = {Xuesong Yang},
  title    = {Machine learning approaches to improving mispronunciation detection on an imbalanced corpus},
  school   = {University of Illinois},
  year     = {2015},
  url      = {https://www.ideals.illinois.edu/items/91251},
  keywords = {recognition}
}
 
@mastersthesis{zhang2015probabilistic,
  author   = {Yang Zhang},
  title    = {Probabilistic Generative Modeling of Speech},
  school   = {University of Illinois},
  year     = {2015},
  url      = {https://www.ideals.illinois.edu/items/91207},
  keywords = {recognition}
}

@mastersthesis{soberal2014face,
  author   = {Daniel Soberal},
  title    = {Face recognition using hidden {Markov} model supervectors},
  school   = {University of Illinois},
  year     = {2014},
  url      = {https://www.ideals.illinois.edu/items/73028},
  keywords = {multimodal}
}
 
@unpublished{qian2014regularized,
  author = {Kaizhi Qian},
  title  = {Regularized Estimation of Gaussian Mixture Models for {SVM} Based Speaker Recognition},
  note   = {Unpublished B.S. Thesis},
  school = {University of Illinois},
  year   = {2014},
  url    = {https://www.ideals.illinois.edu/items/55611}
}

@unpublished{jones2014english,
  author = {Jonathan Jones},
  title  = {{English-Spanish} Language Transfer for Automatic Speech Recognition},
  note   = {Unpublished B.S. Thesis},
  school = {University of Illinois},
  year   = {2014},
  url    = {https://www.ideals.illinois.edu/items/55442}
}
 
@mastersthesis{chen2014automatic,
  author   = {Austin Chen},
  title    = {Automatic Classification of Electronic Music and Speech/Music Audio Content},
  school   = {University of Illinois},
  year     = {2014},
  url      = {https://www.ideals.illinois.edu/items/49620},
  keywords = {analysis}
}

@mastersthesis{bharadwaj2011multiview,
  author   = {Sujeeth Bharadwaj},
  title    = {Multiview feature learning for speech recognition},
  school   = {University of Illinois},
  year     = {2011},
  url      = {https://www.ideals.illinois.edu/items/30027},
  keywords = {recognition}
}
 
@mastersthesis{tidemann2011characterization,
  author   = {Jeremy Tidemann},
  title    = {Characterization of the Head-Related Transfer Function using Chirp and Maximum Length Sequence Excitation Signals},
  school   = {University of Illinois},
  year     = {2011},
  url      = {https://www.ideals.illinois.edu/items/25190},
  keywords = {analysis}
}

@mastersthesis{huang2011non,
  author   = {Po-Sen Huang},
  title    = {Non-speech Acoustic Event Detection Using Multimodal Information},
  school   = {University of Illinois},
  year     = {2011},
  url      = {https://www.ideals.illinois.edu/items/30083},
  keywords = {multimodal}
}
 
@mastersthesis{hu2010thesis,
  author   = {Chi Hu},
  title    = {{FSM-Based} Pronunciation Modeling using Articulatory Phonological Code},
  school   = {University of Illinois},
  year     = {2010},
  url      = {https://www.ideals.illinois.edu/items/16794},
  keywords = {recognition}
}

@unpublished{harwath2010phonetic,
  author = {David Harwath},
  title  = {Phonetic Landmark Detection for Automatic Language Identification},
  note   = {Unpublished B.S. Thesis},
  school = {University of Illinois},
  year   = {2010},
  url    = {https://www.ideals.illinois.edu/items/47011}
}
 
@unpublished{bharadwaj2009advances,
  author = {Sujeeth Bharadwaj},
  title  = {Advances in Sparse Classification},
  note   = {Unpublished B.S. Thesis},
  school = {University of Illinois},
  year   = {2009},
  url    = {https://www.ideals.illinois.edu/items/47037}
}
 
@mastersthesis{sharma2008universal,
  author   = {Harsh Vardhan Sharma},
  title    = {Universal Access: Experiments in Automatic Recognition of Dysarthric Speech},
  school   = {University of Illinois},
  year     = {2008},
  keywords = {recognition}
}

@mastersthesis{borys2008scm,
  author   = {Sarah Borys},
  title    = {An {SVM} Front End Landmark Speech Recognition System},
  school   = {University of Illinois},
  year     = {2008},
  keywords = {recognition}
}

@mastersthesis{li2008incremental,
  author   = {Yang Li},
  title    = {Incremental Training and Growth of Artificial Neural Networks},
  school   = {University of Illinois},
  year     = {2008},
  keywords = {intelligence}
}

@mastersthesis{co2005room,
  author   = {Christopher Co},
  title    = {Room Reconstruction and Navigation Using Acoustically Obtained Room Impulse Responses and a Mobile Robot Platform},
  school   = {University of Illinois},
  year     = {2005},
  url      = {https://www.ideals.illinois.edu/items/42150},
  software = {http://isle.illinois.edu/speech_web_lg/software/2013/co2013software.tgz},
  keywords = {analysis}
}

@mastersthesis{cohen2004survey,
  author   = {Aaron Cohen},
  title    = {A Survey of Machine Learning Methods for Predicting Prosody in Radio Speech},
  school   = {University of Illinois},
  year     = {2004},
  keywords = {analysis}
}

@mastersthesis{jing2002voice,
  author   = {Zhinian Jing},
  title    = {Voice Index and Frame Index for Recognition of Digits in Speech Background},
  school   = {University of Illinois},
  year     = {2002},
  keywords = {recognition}
}

@mastersthesis{gunawan2000distributed,
  author   = {Wira Gunawan},
  title    = {Distributed Speech Recognition},
  school   = {University of Illinois},
  year     = {2000},
  keywords = {recognition}
}

@mastersthesis{setsu2000articulatory,
  author   = {Jul Setsu Cha},
  title    = {Articulatory Speech Synthesis of Female and Male Talkers},
  school   = {UCLA},
  year     = {2000},
  keywords = {synthesis}
}