2024
|
A. Das W. Quamer, R. Gutierrez-Osuna Speech synthesis and pronunciation teaching Book Chapter In: J. Levis C. A. Chapelle, M. Munro; Huensch, A. (Ed.): 2024. @inbook{nokey,
title = {Speech synthesis and pronunciation teaching},
author = {W. Quamer, A. Das, R. Gutierrez-Osuna},
editor = {C. A. Chapelle, J. Levis, M. Munro, C. Nagle, and A. Huensch},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2024/09/book-chapter-preprint.pdf},
year = {2024},
date = {2024-12-31},
urldate = {2024-12-31},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inbook}
}
|
Quamer, W.; Gutierrez-Osuna, R. End-to-end streaming model for low-latency speech anonymization Proceedings Article In: Proc. IEEE Spoken Language Technology Workshop (SLT 2024), 2024. @inproceedings{nokey,
title = {End-to-end streaming model for low-latency speech anonymization},
author = {W. Quamer and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2024/09/waris2024slt.pdf},
year = {2024},
date = {2024-12-02},
urldate = {2024-12-02},
booktitle = {Proc. IEEE Spoken Language Technology Workshop (SLT 2024)},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
E. Do A. Das, N. Glanz; Gutierrez-Osuna, R. Macronutrient constraints and priors improve carbohydrate predictions from continuous glucose monitors Proceedings Article In: IEEE-EMBS International Conference on Body Sensor Networks (BSN'24), 2024. @inproceedings{nokey,
title = {Macronutrient constraints and priors improve carbohydrate predictions from continuous glucose monitors},
author = {A. Das, E. Do, N. Glanz, W. Bevier, R. Santiago, D. Kerr, B. Mortazavi and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2024/08/anurag-BSN24-macro.pdf},
year = {2024},
date = {2024-10-15},
booktitle = {IEEE-EMBS International Conference on Body Sensor Networks (BSN'24)},
keywords = {Continuous glucose monitors, Diabetes},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Das, A.; R. Gutierrez-Osuna, Improving mispronunciation detection using speech reconstruction Journal Article Forthcoming In: IEEE/ACM Transactions on Audio, Speech and Language Processing, Forthcoming. @article{nokey,
title = {Improving mispronunciation detection using speech reconstruction},
author = {A. Das and R. Gutierrez-Osuna,},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2024/07/anurag-taslp-2024.pdf},
year = {2024},
date = {2024-07-19},
journal = {IEEE/ACM Transactions on Audio, Speech and Language Processing},
keywords = {Accent conversion, Speech},
pubstate = {forthcoming},
tppubtype = {article}
}
|
Dave, D.; Vyas, K.; Branan, K.; McKay, S.; DeSalvo, D. J.; Gutierrez-Osuna, R.; Cote, G. L.; Erraguntla, M. Detection of hypoglycemia and hyperglycemia using ECG and accelerometer based non-invasive wearable sensors Journal Article In: Journal of Diabetes Science and Technology, vol. 18, iss. 2, 2024. @article{darpit2022jdst,
title = {Detection of hypoglycemia and hyperglycemia using ECG and accelerometer based non-invasive wearable sensors},
author = {D. Dave and K. Vyas and K. Branan and S. McKay and D. J. DeSalvo and R. Gutierrez-Osuna and G. L. Cote and M. Erraguntla},
url = {https://journals.sagepub.com/doi/full/10.1177/19322968221116393
https://psi.engr.tamu.edu/wp-content/uploads/2024/07/darpit-2024-jdst-1.pdf},
year = {2024},
date = {2024-07-16},
urldate = {2024-07-16},
journal = {Journal of Diabetes Science and Technology},
volume = {18},
issue = {2},
keywords = {Continuous glucose monitors, Diabetes, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
da C. Silva, D. R.; Gutierrez-Osuna, R. Does gamified breath-biofeedback promote adherence, relaxation, and skill transfer in the wild? Journal Article Forthcoming In: IEEE Transactions on Affective Computing, Forthcoming. @article{nokey,
title = {Does gamified breath-biofeedback promote adherence, relaxation, and skill transfer in the wild?},
author = {D. R. da C. Silva and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2024/07/Dennis-TAC-GBF-2024.pdf},
year = {2024},
date = {2024-07-15},
journal = {IEEE Transactions on Affective Computing},
keywords = {Games, Stress},
pubstate = {forthcoming},
tppubtype = {article}
}
|
R. Neiriz A. Silpachai, M. Novotny; Chukharey, E. Corrective feedback accuracy and pronunciation improvement: Feedback that is ‘good enough’ Journal Article In: Language Learning & Technology, vol. 28, iss. 1, pp. 1–16, 2024. @article{nokey,
title = {Corrective feedback accuracy and pronunciation improvement: Feedback that is ‘good enough’},
author = {A. Silpachai, R. Neiriz, M. Novotny, R. Gutierrez-Osuna, J. M. Levis and E. Chukharey
},
url = {https://hdl.handle.net/10125/73582https://psi.engr.tamu.edu/wp-content/uploads/2024/07/llt-2024-good-enough.pdf
https://hdl.handle.net/10125/73582},
year = {2024},
date = {2024-06-17},
journal = {Language Learning & Technology},
volume = {28},
issue = {1},
pages = {1–16},
keywords = {Speech},
pubstate = {published},
tppubtype = {article}
}
|
J. McMurray K. L. Branan, R. Jennings II Physiological sensing on the upper arm with a wireless multi-modal wearable Proceedings Article In: Optical Diagnostics and Sensing XXIV: Toward Point-of-Care Diagnostics, 2024. @inproceedings{nokey,
title = {Physiological sensing on the upper arm with a wireless multi-modal wearable},
author = {K. L. Branan, J. McMurray, R. Jennings II, M. Erraguntla, R. Gutierrez-Osuna, G. L. Coté
},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2024/07/kimberly-2024-biomonitor.pdf
https://www.spiedigitallibrary.org/conference-proceedings-of-spie/12850/128500D/Physiological-sensing-on-the-upper-arm-with-a-wireless-multi/10.1117/12.3003163.full},
year = {2024},
date = {2024-03-12},
booktitle = {Optical Diagnostics and Sensing XXIV: Toward Point-of-Care Diagnostics},
keywords = {Diabetes, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
2023
|
Sicong Huang Lida Zhang, Anurag Das Joint embedding of food photographs and blood blucose for improved calorie estimation Proceedings Article In: IEEE-EMBS Int. Conf. Body Sensor Networks (IEEE BSN) , 2023. @inproceedings{nokey,
title = {Joint embedding of food photographs and blood blucose for improved calorie estimation},
author = {Lida Zhang, Sicong Huang, Anurag Das, Edmund Do, Namino Glantz, Wendy Bevier, Rony Santiago, David Kerr, Ricardo Gutierrez-Osuna, Bobak J. Mortazavi
},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2023/11/photoCGM2023lida.pdf},
year = {2023},
date = {2023-10-09},
urldate = {2023-10-09},
booktitle = {IEEE-EMBS Int. Conf. Body Sensor Networks (IEEE BSN) },
journal = {Proc. IEEE-EMBS International Conference on Body Sensor Networks: Sensors and Systems for Digital Health (IEEE BSN) 2023},
keywords = {Continuous glucose monitors, Diabetes},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Anurag Das Edmund Do, Namino Glanz Modeling the effect of non-exercise activity thermogenesis on peak post-prandial glucose Proceedings Article In: IEEE-EMBS International Conference on Body Sensor Networks: Sensors and Systems for Digital Health (IEEE BSN) 2023
, 2023. @inproceedings{nokey,
title = {Modeling the effect of non-exercise activity thermogenesis on peak post-prandial glucose},
author = {Edmund Do, Anurag Das, Namino Glanz, Wendy Bevier, Rony Santiago, David Kerr, Ricardo Gutierrez-Osuna, Bobak J. Mortazavi},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2023/11/neat2023edmund.pdf},
year = {2023},
date = {2023-10-09},
urldate = {2023-10-09},
booktitle = {IEEE-EMBS International Conference on Body Sensor Networks: Sensors and Systems for Digital Health (IEEE BSN) 2023
},
keywords = {Continuous glucose monitors, Diabetes},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Carolina Villegas Kathan Vyas, Elizabeth Kubota-Mishra; Gutierrez-Osuna, Ricardo Detection of glycemic excursions using morphological and time-domain ECG features Proceedings Article In: IEEE-EMBS Intl. Conf. Body Sensor Networks(IEEE BSN) 2023
, 2023. @inproceedings{nokey,
title = {Detection of glycemic excursions using morphological and time-domain ECG features},
author = {Kathan Vyas, Carolina Villegas, Elizabeth Kubota-Mishra, Darpit Dave,
Madhav Erraguntla, Gerard Coté, Daniel J. DeSalvo, Siripoom McKay and Ricardo Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2023/11/hypoglycemia2023kathan.pdf},
year = {2023},
date = {2023-10-09},
booktitle = {IEEE-EMBS Intl. Conf. Body Sensor Networks(IEEE BSN) 2023
},
keywords = {Continuous glucose monitors, Diabetes},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Anurag Das Waris Quamer, Ricardo Gutierrez-Osuna Decoupling segmental and prosodic cues of non-native speech through vector quantization Proceedings Article In: Proc. Interspeech, 2023. @inproceedings{nokey,
title = {Decoupling segmental and prosodic cues of non-native speech through vector quantization},
author = {Waris Quamer, Anurag Das, Ricardo Gutierrez-Osuna
},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2023/11/decouplingProsody2023waris.pdf},
year = {2023},
date = {2023-08-20},
urldate = {2023-08-20},
booktitle = {Proc. Interspeech},
journal = {Interspeech 2023},
keywords = {Accent conversion, Speech, Voice conversion},
pubstate = {published},
tppubtype = {inproceedings}
}
|
da C. Silva, D. R.; Wang, Z.; Gutierrez-Osuna, R. Towards Participant-Independent Stress Detection Using Instrumented Peripherals Journal Article In: IEEE Transactions on Affective Computing, 2023. @article{dennis2021tac,
title = {Towards Participant-Independent Stress Detection Using Instrumented Peripherals},
author = {D. R. da C. Silva and Z. Wang and R. Gutierrez-Osuna},
url = {https://ieeexplore.ieee.org/document/9361293
https://psi.engr.tamu.edu/wp-content/uploads/2023/11/keyboard2023dennis.pdf},
year = {2023},
date = {2023-01-01},
urldate = {2021-02-05},
journal = {IEEE Transactions on Affective Computing},
keywords = {Health, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
Mortazavi, B. J.; Gutierrez-Osuna, R. A review of digital innovations for diet monitoring and precision nutrition Journal Article In: Journal of Diabetes Science and Technology, 2023. @article{,
title = {A review of digital innovations for diet monitoring and precision nutrition},
author = {B. J. Mortazavi and R. Gutierrez-Osuna},
url = {https://journals.sagepub.com/doi/full/10.1177/19322968211041356
https://psi.engr.tamu.edu/wp-content/uploads/2023/11/digitalInnovations2023bobak.pdf},
year = {2023},
date = {2023-01-01},
urldate = {2021-07-14},
journal = {Journal of Diabetes Science and Technology},
keywords = {Chemical sensors, Diabetes, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
2022
|
Ravuri, Vinesh; Gutierrez-Osuna, Ricardo; Chaspari, Theodora Preserving Mental Health Information in Speech Anonymization Proceedings Article In: 10th International Conference on Affective Computing & Intelligent Interaction (ACII2022)
, 2022. @inproceedings{nokey,
title = {Preserving Mental Health Information in Speech Anonymization},
author = {Vinesh Ravuri and Ricardo Gutierrez-Osuna and Theodora Chaspari},
url = {https://ieeexplore.ieee.org/abstract/document/10086012
https://psi.engr.tamu.edu/wp-content/uploads/2023/11/chaspari2022speechAnonimization.pdf},
year = {2022},
date = {2022-10-18},
urldate = {2022-10-18},
booktitle = {10th International Conference on Affective Computing & Intelligent Interaction (ACII2022)
},
keywords = {Mental health},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Husseini, D. Al; Lin, P. T.; Sukhishvili, S. A.; Zhou, J.; Li, J.; Lin, P. T.; Gutierrez-Osuna, R.; Coté, G. L. Silane-modified mesoporous silica nanocoatings for selective mid-infrared waveguide-based gas sensing Journal Article Forthcoming In: Advanced Materials Interfaces, Forthcoming. @article{diana2022mesoporous,
title = {Silane-modified mesoporous silica nanocoatings for selective mid-infrared waveguide-based gas sensing},
author = {D. Al Husseini and P. T. Lin and S. A. Sukhishvili and J. Zhou and J. Li and P. T. Lin and R. Gutierrez-Osuna and G. L. Coté},
year = {2022},
date = {2022-09-29},
journal = {Advanced Materials Interfaces},
keywords = {Chemical sensors},
pubstate = {forthcoming},
tppubtype = {article}
}
|
Quamer, W.; Das, A.; Levis, J.; Chukharev-Hudilainen, E.; Gutierrez-Osuna, R. Zero-Shot Foreign Accent Conversion without a Native Reference Proceedings Article Forthcoming In: Proc. Interspeech, Forthcoming. @inproceedings{waris2022interspeech,
title = {Zero-Shot Foreign Accent Conversion without a Native Reference},
author = {W. Quamer and A. Das and J. Levis and E. Chukharev-Hudilainen and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2023/02/quamer2022interspeech.pdf},
year = {2022},
date = {2022-09-18},
urldate = {2022-09-18},
booktitle = {Proc. Interspeech},
keywords = {Accent conversion, Deep learning, Speech},
pubstate = {forthcoming},
tppubtype = {inproceedings}
}
|
Zhou, J.; Husseini, D. Al; Li, J.; Lin, Z.; Sukhishvili, S.; Cote, G. L.; Gutierrez-Osuna, R.; Lin, P. T. Mid-Infrared Serial Microring Resonator Array for Real-time Detection of Vapor Phase Volatile Organic Compounds Journal Article Forthcoming In: Analytical Chemistry, Forthcoming. @article{junchao2022ac,
title = {Mid-Infrared Serial Microring Resonator Array for Real-time Detection of Vapor Phase Volatile Organic Compounds},
author = {J. Zhou and D. Al Husseini and J. Li and Z. Lin and S. Sukhishvili and G. L. Cote and R. Gutierrez-Osuna and P. T. Lin },
year = {2022},
date = {2022-07-19},
journal = {Analytical Chemistry},
keywords = {Chemical sensors, Infrared spectroscopy},
pubstate = {forthcoming},
tppubtype = {article}
}
|
Das, A.; Mortazavi, B.; Sajjadi, S.; Chaspari, T.; Ruebush, L. E.; Deutz, N. E.; Cote, G. L.; Gutierrez-Osuna, R. Predicting the macronutrient composition of mixed meals from dietary biomarkers in blood Journal Article In: IEEE Journal of Biomedical and Health Informatics, vol. 26, no. 6, pp. 2726-2736, 2022. @article{anurag2021aminoacids,
title = {Predicting the macronutrient composition of mixed meals from dietary biomarkers in blood},
author = {A. Das and B. Mortazavi and S. Sajjadi and T. Chaspari and L. E. Ruebush and N. E. Deutz and G. L. Cote and R. Gutierrez-Osuna},
url = {https://ieeexplore.ieee.org/document/9645322
https://psi.engr.tamu.edu/wp-content/uploads/2021/12/jbhi-aminoacids-2021-preprint.pdf},
year = {2022},
date = {2022-06-04},
urldate = {2021-12-05},
journal = {IEEE Journal of Biomedical and Health Informatics},
volume = {26},
number = {6},
pages = {2726-2736},
keywords = {Chemical sensors, Continuous glucose monitors, Health, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
Liberatore, C.; Gutierrez-Osuna, R. Minimizing residuals for native-nonnative voice conversion in a sparse, anchor-based representation of speech Proceedings Article In: Proc. ICASSP, 2022. @inproceedings{liberatore2022icassp,
title = {Minimizing residuals for native-nonnative voice conversion in a sparse, anchor-based representation of speech},
author = {C. Liberatore and R. Gutierrez-Osuna},
year = {2022},
date = {2022-05-22},
booktitle = {Proc. ICASSP},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Yang, M.; Dave, D.; Erraguntla, M.; Cote, G.; Gutierrez-Osuna, R. Joint hypoglycemia prediction and glucose forecasting via deep multi-task learning Proceedings Article In: Proc. ICASSP, 2022. @inproceedings{mu2022icassp,
title = {Joint hypoglycemia prediction and glucose forecasting via deep multi-task learning},
author = {M. Yang and D. Dave and M. Erraguntla and G. Cote and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2023/07/yang2022icassp_hypoglycemia.pdf
https://ieeexplore.ieee.org/document/9746129},
year = {2022},
date = {2022-05-22},
urldate = {2022-05-22},
booktitle = {Proc. ICASSP},
keywords = {Continuous glucose monitors, Deep learning, Health, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Paul, Sudip; Sharma, Rohit; Tathireddy, Prashant; Gutierrez-Osuna, Ricardo On-line drift-compensation for continuous monitoring with arrays of cross-sensitive chemical sensors Journal Article Forthcoming In: Sensors and Actuators B: Chemical, Forthcoming. @article{sudip-2022sab,
title = {On-line drift-compensation for continuous monitoring with arrays of cross-sensitive chemical sensors},
author = {Sudip Paul and Rohit Sharma and Prashant Tathireddy and Ricardo Gutierrez-Osuna},
year = {2022},
date = {2022-05-17},
journal = {Sensors and Actuators B: Chemical},
keywords = {Chemical sensors},
pubstate = {forthcoming},
tppubtype = {article}
}
|
Zhou, Junchao; Husseini, Diana Al; Li, Junyan; Lin, Zhihai; Sukhishvili, Svetlana; Coté, Gerard L.; Gutierrez-Osuna, Ricardo; Lin, Pao Tai Detection of Volatile Organic Compounds Using Mid-Infrared Silicon Nitride Waveguide Sensors Journal Article In: Scientific Reports, vol. 12, no. 5572 , 2022. @article{junchao-2022-scirep,
title = {Detection of Volatile Organic Compounds Using Mid-Infrared Silicon Nitride Waveguide Sensors},
author = {Junchao Zhou and Diana Al Husseini and Junyan Li and Zhihai Lin and Svetlana Sukhishvili and Gerard L. Coté and Ricardo Gutierrez-Osuna and Pao Tai Lin},
url = {https://www.nature.com/articles/s41598-022-09597-9
https://psi.engr.tamu.edu/wp-content/uploads/2022/04/s41598-022-09597-9.pdf},
year = {2022},
date = {2022-03-15},
urldate = {2022-03-15},
journal = {Scientific Reports},
volume = { 12},
number = {5572 },
keywords = {Chemical sensors},
pubstate = {published},
tppubtype = {article}
}
|
Branan, Kimberly L.; Reyes, Gilberto O. Flores; Abel, John A.; Erraguntla, Madhav; Gutierrez-Osuna, Ricardo; Coté, Gerard L. Multi-modal physiological sensing on the upper arm Proceedings Article In: Proc. SPIE, 2022. @inproceedings{kimberly2022spie,
title = {Multi-modal physiological sensing on the upper arm},
author = {Kimberly L. Branan and Gilberto O. Flores Reyes and John A. Abel and Madhav Erraguntla and Ricardo Gutierrez-Osuna and Gerard L. Coté},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2022/04/1195608.pdf},
year = {2022},
date = {2022-03-02},
urldate = {2022-03-02},
booktitle = {Proc. SPIE},
journal = {Proceedings of SPIE},
volume = {11956},
keywords = {Continuous glucose monitors, Health, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
2021
|
Chakravarthy, N. V.; Silva, D. R. Da Cunha; Gutierrez-Osuna, R. Evaluating the role of breathing guidance on game-based interventions for relaxation training Journal Article In: Frontiers in Digital Health, 2021. @article{nitin2021digitalhealth,
title = {Evaluating the role of breathing guidance on game-based interventions for relaxation training},
author = {N. V. Chakravarthy and D. R. Da Cunha Silva and R. Gutierrez-Osuna},
url = {https://www.frontiersin.org/articles/10.3389/fdgth.2021.760268/abstract
https://psi.engr.tamu.edu/wp-content/uploads/2021/12/nitin2021frontiers.pdf},
year = {2021},
date = {2021-11-18},
urldate = {2021-11-18},
journal = {Frontiers in Digital Health},
keywords = {Games, Health, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
Ding, S.; Zhao, G.; Gutierrez-Osuna, R. Accentron: Foreign accent conversion to arbitrary non-native speakers using zero-shot learning Journal Article In: Computer Speech & Language, 2021. @article{shaojin2021accentron,
title = {Accentron: Foreign accent conversion to arbitrary non-native speakers using zero-shot learning},
author = {S. Ding and G. Zhao and R. Gutierrez-Osuna},
url = {https://www.sciencedirect.com/science/article/pii/S0885230821001029
https://psi.engr.tamu.edu/wp-content/uploads/2021/10/1-s2.0-S0885230821001029-main.pdf},
year = {2021},
date = {2021-10-14},
urldate = {2021-10-14},
journal = {Computer Speech & Language},
keywords = {Accent conversion, Deep learning, Speech},
pubstate = {published},
tppubtype = {article}
}
|
Hair, A.; Zhao, G.; Ahmed, B.; Ballard, K. J.; Gutierrez-Osuna, R. Assessing Posterior-Based Mispronunciation Detection on Field-Collected Recordings from Child Speech Therapy Sessions Proceedings Article In: Proc. Interspeech, 2021. @inproceedings{adam2021interspeech,
title = {Assessing Posterior-Based Mispronunciation Detection on Field-Collected Recordings from Child Speech Therapy Sessions},
author = {A. Hair and G. Zhao and B. Ahmed and K. J. Ballard and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2021/08/hair_interspeech_2021.pdf},
year = {2021},
date = {2021-08-30},
booktitle = {Proc. Interspeech},
keywords = {Automatic Speech Recognition, Childhood apraxia of speech, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Silpachai, A.; Rehman, I.; Barriuso, T. A.; Levis, J.; Chukharev-Hudilainen, E.; Zhao, G.; Gutierrez-Osuna, R. Effects Of Voice Type And Task On L2 Learners’ Awareness Of Pronunciation Errors Proceedings Article In: Proc. Interspeech, 2021. @inproceedings{alif2021interspeech,
title = {Effects Of Voice Type And Task On L2 Learners’ Awareness Of Pronunciation Errors},
author = {A. Silpachai and I. Rehman and T. A. Barriuso and J. Levis and E. Chukharev-Hudilainen and G. Zhao and R. Gutierrez-Osuna},
year = {2021},
date = {2021-08-30},
booktitle = {Proc. Interspeech},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Liberatore, C.; Gutierrez-Osuna, R. An Exemplar Selection Algorithm For Native-Nonnative Voice Conversion Proceedings Article In: Proc. Interspeech, 2021. @inproceedings{chris2021ARS,
title = {An Exemplar Selection Algorithm For Native-Nonnative Voice Conversion},
author = {C. Liberatore and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2022/07/liberatore21_interspeech.pdf},
year = {2021},
date = {2021-08-30},
urldate = {2021-08-30},
booktitle = {Proc. Interspeech},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Yang, M.; Paromita, P.; Chaspari, T.; Das, A.; Sajjadi, S.; Mortazavi, B. J.; Gutierrez-Osuna, R. A Metric Learning Approach for Personalized Meal Macronutrient Estimation from Postprandial Glucose Response Signals Proceedings Article In: Proc. IEEE/EMBS Intl. Conf. Biomedical And Health Informatics (BHI 2021)., 2021. @inproceedings{theodora2021bhi,
title = {A Metric Learning Approach for Personalized Meal Macronutrient Estimation from Postprandial Glucose Response Signals},
author = {M. Yang and P. Paromita and T. Chaspari and A. Das and S. Sajjadi and B. J. Mortazavi and R. Gutierrez-Osuna},
url = {http://ceur-ws.org/Vol-2903/IUI21WS-HEALTHI-10.pdf
https://psi.engr.tamu.edu/wp-content/uploads/2022/01/IUI21WS-HEALTHI-10.pdf},
year = {2021},
date = {2021-07-27},
urldate = {2021-07-27},
booktitle = {Proc. IEEE/EMBS Intl. Conf. Biomedical And Health Informatics (BHI 2021).},
keywords = {Chemical sensors, Continuous glucose monitors, Deep learning, Health, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Hagve, M.; Simbo, S. Y.; Ruebush, L. E.; Engelen, M. P. K. J.; Gutierrez-Osuna, R.; Mortazavi, B. J.; Cote, G. L.; Deutz, N. E. P. Postprandial concentration of circulating branched chain amino acids are able to predict the carbohydrate content of the ingested mixed meal Journal Article In: Clinical Nutrition, 2021. @article{martin2021clinicalnutrition,
title = {Postprandial concentration of circulating branched chain amino acids are able to predict the carbohydrate content of the ingested mixed meal},
author = {M. Hagve and S. Y. Simbo and L. E. Ruebush and M. P. K. J. Engelen and R. Gutierrez-Osuna and B. J. Mortazavi and G. L. Cote and N. E. P. Deutz},
url = {https://www.sciencedirect.com/science/article/pii/S0261561421003502
https://psi.engr.tamu.edu/wp-content/uploads/2021/07/1-s2.0-S0261561421003502-main.pdf},
year = {2021},
date = {2021-07-13},
journal = {Clinical Nutrition},
keywords = {Chemical sensors, Continuous glucose monitors, Health, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
Zhao, G.; Ding, S.; Gutierrez-Osuna, R. Converting Foreign Accent Speech Without a Reference Journal Article In: IEEE/ACM Transactions on Audio, Speech, and Language Processing, vol. 29, pp. 2367, 2021. @article{guanlong2021reference-free,
title = {Converting Foreign Accent Speech Without a Reference},
author = {G. Zhao and S. Ding and R. Gutierrez-Osuna},
url = {https://ieeexplore.ieee.org/abstract/document/9477581
https://psi.engr.tamu.edu/wp-content/uploads/2021/08/zhao2021reference.pdf},
year = {2021},
date = {2021-07-01},
urldate = {2021-07-01},
journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
volume = {29},
pages = {2367},
keywords = {Accent conversion, Deep learning, Speech},
pubstate = {published},
tppubtype = {article}
}
|
Das, A.; Mortazavi, B.; Chaspari, T.; Sajjadi, S.; Paromita, P.; Ruebush, L.; Deutz, N.; Gutierrez-Osuna, R. A sparse coding approach to automatic diet monitoring with continuous glucose monitors Proceedings Article In: In Proc. ICASSP, 2021. @inproceedings{anurag2021icassp,
title = {A sparse coding approach to automatic diet monitoring with continuous glucose monitors},
author = {A. Das and B. Mortazavi and T. Chaspari and S. Sajjadi and P. Paromita and L. Ruebush and N. Deutz and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2021/08/ICASSP_2021_AnuragDas.pdf},
year = {2021},
date = {2021-06-06},
booktitle = {In Proc. ICASSP},
keywords = {Chemical sensors, Continuous glucose monitors, Health, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Sajjadi, S.; Mortazavi, B. J.; Das, A.; Chaspari, T.; Paromita, P.; Ruebush, L. E.; Deutz, N. E.; Gutierrez-Osuna, R. Towards the development of subject-independent inverse metabolic models Proceedings Article In: In Proc. ICASSP, 2021. @inproceedings{hooman2021icassp,
title = {Towards the development of subject-independent inverse metabolic models},
author = {S. Sajjadi and B. J. Mortazavi and A. Das and T. Chaspari and P. Paromita and L. E. Ruebush and N. E. Deutz and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2021/08/ICASSP_21_SubjectIndependentIMM_CameraReady.pdf},
year = {2021},
date = {2021-06-06},
booktitle = {In Proc. ICASSP},
keywords = {Chemical sensors, Continuous glucose monitors, Health, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Paromita, P.; Chaspari, T.; Sajjadi, S.; Das, A.; Mortazavi, B. J.; Gutierrez-Osuna, R. Personalized Meal Classification Using Continuous Glucose Monitors Proceedings Article In: In Proc. IUI HEALTHI Workshop, 2021. @inproceedings{psyche2021healthi,
title = {Personalized Meal Classification Using Continuous Glucose Monitors},
author = {P. Paromita and T. Chaspari and S. Sajjadi and A. Das and B. J. Mortazavi and R. Gutierrez-Osuna},
year = {2021},
date = {2021-04-13},
urldate = {2021-04-13},
booktitle = {In Proc. IUI HEALTHI Workshop},
keywords = {Chemical sensors, Continuous glucose monitors, Deep learning, Health, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Hair, A.; Ballard, K. J.; Markoulli, C.; Monroe, P.; McKechnie, J.; Ahmed, B.; Gutierrez-Osuna, R. A Longitudinal Evaluation of Tablet-Based Child Speech Therapy with Apraxia World Journal Article In: ACM Transactions On Accessible Computing, vol. 14, no. 1, 2021. @article{adam2021TACCESS,
title = {A Longitudinal Evaluation of Tablet-Based Child Speech Therapy with Apraxia World},
author = {A. Hair and K. J. Ballard and C. Markoulli and P. Monroe and J. McKechnie and B. Ahmed and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2021/08/hair_taccess_2021.pdf},
doi = {10.1145/3433607},
year = {2021},
date = {2021-03-15},
journal = {ACM Transactions On Accessible Computing},
volume = {14},
number = {1},
abstract = {Digital games can make speech therapy exercises more enjoyable for children and increase their motivation during therapy. However, many such games developed to date have not been designed for long-term use. To address this issue, we developed Apraxia World, a speech therapy game specifically intended to be played over extended periods. In this study, we examined pronunciation improvements, child engagement over time, and caregiver and automated pronunciation evaluation accuracy while using our game over a multi-month period. Ten children played Apraxia World at home during two counterbalanced four-week treatment blocks separated by a two-week break. In one treatment phase, children received pronunciation feedback from caregivers and in the other treatment phase, utterances were evaluated with an automated framework built into the game. We found that children made therapeutically significant speech improvements while using Apraxia World, and that the game successfully increased engagement during speech therapy practice. Additionally, in offline mispronunciation detection tests, our automated pronunciation evaluation framework outperformed a traditional method based on goodness of pronunciation scoring. Our results suggest that this type of speech therapy game is a valid complement to traditional home practice.},
keywords = {Games, Health, Speech},
pubstate = {published},
tppubtype = {article}
}
Digital games can make speech therapy exercises more enjoyable for children and increase their motivation during therapy. However, many such games developed to date have not been designed for long-term use. To address this issue, we developed Apraxia World, a speech therapy game specifically intended to be played over extended periods. In this study, we examined pronunciation improvements, child engagement over time, and caregiver and automated pronunciation evaluation accuracy while using our game over a multi-month period. Ten children played Apraxia World at home during two counterbalanced four-week treatment blocks separated by a two-week break. In one treatment phase, children received pronunciation feedback from caregivers and in the other treatment phase, utterances were evaluated with an automated framework built into the game. We found that children made therapeutically significant speech improvements while using Apraxia World, and that the game successfully increased engagement during speech therapy practice. Additionally, in offline mispronunciation detection tests, our automated pronunciation evaluation framework outperformed a traditional method based on goodness of pronunciation scoring. Our results suggest that this type of speech therapy game is a valid complement to traditional home practice. |
Parnandi, A.; Gutierrez-Osuna, R. Partial reinforcement in game biofeedback for relaxation training Journal Article In: IEEE Transactions on Affective Computing, vol. 12, no. 1, pp. 141-153, 2021. @article{parnandi2018taffc,
title = {Partial reinforcement in game biofeedback for relaxation training},
author = {A. Parnandi and R. Gutierrez-Osuna },
url = {https://ieeexplore.ieee.org/document/8400398
https://psi.engr.tamu.edu/wp-content/uploads/2021/02/08400398.pdf},
year = {2021},
date = {2021-02-28},
journal = {IEEE Transactions on Affective Computing},
volume = {12},
number = {1},
pages = {141-153},
keywords = {Electrodermal activity, Games, Health, Heart rate variability, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
Husseini, D. Al; Karanth, Y.; Zhou, J.; Willhelm, D.; Qian, X.; Gutierrez-Osuna, R.; Coté, G. L.; and P. Tai Lin,; Sukhishvili, S. A. Surface Functionalization Utilizing Mesoporous Silica Nanoparticles for Enhanced Evanescent-Field Mid-Infrared Waveguide Gas Sensing Journal Article In: Coatings, vol. 11, no. 118, pp. 1-12, 2021. @article{alhusseini2021coatings,
title = {Surface Functionalization Utilizing Mesoporous Silica Nanoparticles for Enhanced Evanescent-Field Mid-Infrared Waveguide Gas Sensing},
author = {D. Al Husseini and Y. Karanth and J. Zhou and D. Willhelm and X. Qian and R. Gutierrez-Osuna and G. L. Coté and and P. Tai Lin and S. A. Sukhishvili},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2021/01/ahhusseini2021coatings.pdf
https://www.mdpi.com/2079-6412/11/2/118},
year = {2021},
date = {2021-01-21},
journal = {Coatings},
volume = {11},
number = {118},
pages = {1-12},
keywords = {Chemical sensors, Infrared spectroscopy},
pubstate = {published},
tppubtype = {article}
}
|
2020
|
Ahmed, B; Zafar, M; Rihawi, R; Gutierrez-Osuna, R Gaming away stress: Using biofeedback games to learn paced breathing Journal Article In: IEEE Transactions on Affective Computing, vol. 11, no. 3, pp. 519-531, 2020. @article{ahmed2018tac,
title = {Gaming away stress: Using biofeedback games to learn paced breathing},
author = {B Ahmed and M Zafar and R Rihawi and R Gutierrez-Osuna},
url = {https://ieeexplore.ieee.org/document/8319498},
year = {2020},
date = {2020-12-02},
journal = {IEEE Transactions on Affective Computing},
volume = {11},
number = {3},
pages = {519-531},
keywords = {Electrodermal activity, Games, Health, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
Zaman, S.; Wesley, A.; Silva, D. Rodrigo Da Cunha; Buddharaju, P.; Akbar, F.; Gao, G.; Mark, G.; Gutierrez-Osuna, R.; Pavlidis, I. Stress and productivity patterns of interrupted, synergistic, and antagonistic office activities Journal Article In: Scientific Data, vol. 6, no. 1, 2020. @article{zaman2019scientificdata,
title = {Stress and productivity patterns of interrupted, synergistic, and antagonistic office activities},
author = {S. Zaman and A. Wesley and D. Rodrigo Da Cunha Silva and P. Buddharaju and F. Akbar and G. Gao and G. Mark and R. Gutierrez-Osuna and I. Pavlidis},
url = {https://www.nature.com/articles/s41597-019-0249-5
https://psi.engr.tamu.edu/wp-content/uploads/2020/04/shaila2019scientificdata.pdf},
year = {2020},
date = {2020-11-08},
journal = {Scientific Data},
volume = {6},
number = {1},
keywords = {Electrodermal activity, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
Ding, S.; Zhao, G.; Gutierrez-Osuna, R. Improving the Speaker Identity of Non-Parallel Many-to-Many Voice Conversion with Adversarial Speaker Recognition Proceedings Article In: Proc. Interspeech, 2020. @inproceedings{shaojin-2020-interspeech,
title = {Improving the Speaker Identity of Non-Parallel Many-to-Many Voice Conversion with Adversarial Speaker Recognition},
author = {S. Ding and G. Zhao and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2020/08/IS2020_shaojin_Adversarial_speaker_classifier_camera_ready.pdf},
year = {2020},
date = {2020-10-25},
urldate = {2020-10-25},
booktitle = {Proc. Interspeech},
keywords = {Accent conversion, Deep learning, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Das, A.; Zhao, G.; Levis, J.; Chukharev-Hudilainen, E.; Gutierrez-Osuna, R. Understanding the Effect of Voice Quality and Accent on Talker Similarity Proceedings Article In: Proc. Interspeech, 2020. @inproceedings{anurag-2020-interspeech,
title = {Understanding the Effect of Voice Quality and Accent on Talker Similarity},
author = {A. Das and G. Zhao and J. Levis and E. Chukharev-Hudilainen and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2023/02/das2020interspeech.pdf},
year = {2020},
date = {2020-10-24},
urldate = {2020-10-24},
booktitle = {Proc. Interspeech},
keywords = {Accent conversion, Deep learning, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Husseini, D. Al; Zhou, J.; Willhelm, D.; Hastings, T.; Day, G. S.; Zhou, H. -C.; Coté, G. L.; Qian, X.; R. Gutierrez-Osuna, P. T. Lin; Sukhishvili, S. All-Nanoparticle Layer-by-layer Coatings for Mid-IR On-Chip Gas Sensing Journal Article In: Chemical Communications, 2020. @article{alhusseini2020chemComm,
title = {All-Nanoparticle Layer-by-layer Coatings for Mid-IR On-Chip Gas Sensing},
author = {D. Al Husseini and J. Zhou and D. Willhelm and T. Hastings and G. S. Day and H.-C. Zhou and G. L. Coté and X. Qian and R. Gutierrez-Osuna, P. T. Lin and S. Sukhishvili},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2020/10/d0cc05513a.pdf
https://pubs.rsc.org/en/content/articlelanding/2020/cc/d0cc05513a#!divAbstract},
year = {2020},
date = {2020-10-22},
journal = {Chemical Communications},
keywords = {Chemical sensors},
pubstate = {published},
tppubtype = {article}
}
|
Lučić, I.; Silpachai, A.; Levis, J.; Zhao, G; Gutierrez-Osuna, R. The English Pronunciation of Arabic Speakers - A Data-Driven Approach to Segmental Error Identification Journal Article In: Language Teaching Research, 2020. @article{ivana2020ltr,
title = {The English Pronunciation of Arabic Speakers - A Data-Driven Approach to Segmental Error Identification},
author = {I. Lučić and A. Silpachai and J. Levis and G Zhao and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2020/06/1362168820931888.pdf},
year = {2020},
date = {2020-06-18},
journal = {Language Teaching Research},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {article}
}
|
McKechnie, J.; Ahmed, B.; Gutierrez-Osuna, R.; Murray, E.; McCabe, P.; Ballard, K. The influence of type of feedback during tablet-based delivery of intensive treatment for childhood apraxia of speech Journal Article In: Journal of Communication Disorders, 2020. @article{McKechnie2020tabbyTalks,
title = {The influence of type of feedback during tablet-based delivery of intensive treatment for childhood apraxia of speech},
author = {J. McKechnie and B. Ahmed and R. Gutierrez-Osuna and E. Murray and P. McCabe and K. Ballard},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2020/08/1-s2.0-S0021992420300940-main.pdf
https://www.sciencedirect.com/science/article/pii/S0021992420300940},
year = {2020},
date = {2020-05-20},
journal = {Journal of Communication Disorders},
keywords = {Health, Speech},
pubstate = {published},
tppubtype = {article}
}
|
Blank, C.; Zaman, S.; Wesley, A.; Tsiamyrtzis, P.; Silva, D. R. Da Cunha; Gutierrez-Osuna, R.; Mark, G.; Pavlidis, I. Emotional Footprints of Email Interruptions Proceedings Article In: Proc. CHI, 2020. @inproceedings{blank-2020-chi,
title = {Emotional Footprints of Email Interruptions},
author = {C. Blank and S. Zaman and A. Wesley and P. Tsiamyrtzis and D. R. Da Cunha Silva and R. Gutierrez-Osuna and G. Mark and I. Pavlidis},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2020/06/3313831.3376282.pdf},
year = {2020},
date = {2020-04-25},
booktitle = {Proc. CHI},
keywords = {Electrodermal activity, Health, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Hair, A; Markoulli, C; Monroe, P; McKechnie, J; Ballard, K J; Ahmed, B; Gutierrez-Osuna, R Preliminary Results From a Longitudinal Study of a Tablet-Based Speech Therapy Game Proceedings Article In: Extended Abstracts of the 2020 CHI Conference on Human Factors in Computing, ACM, 2020, ISBN: 978-1-4503-6819-3/20/04. @inproceedings{hair2020chi,
title = {Preliminary Results From a Longitudinal Study of a Tablet-Based Speech Therapy Game},
author = {A Hair and C Markoulli and P Monroe and J McKechnie and K J Ballard and B Ahmed and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2020/02/hair2020chi.pdf},
doi = {10.1145/3334480.3382886},
isbn = {978-1-4503-6819-3/20/04},
year = {2020},
date = {2020-04-25},
booktitle = {Extended Abstracts of the 2020 CHI Conference on Human Factors in Computing},
publisher = {ACM},
abstract = {We previously developed a tablet-based speech therapy game called Apraxia World to address barriers to treatment and increase child motivation during therapy. In this study, we examined pronunciation improvements, child engagement over time, and caregiver evaluation performance while using our game. We recruited ten children to play Apraxia World at home during two four-week treatment blocks, separated by a two-week break; nine of ten have completed the protocol at time of writing. In the treatment blocks, children’s utterances were evaluated either by caregivers or an automated pronunciation framework. Preliminary analysis suggests that children made significant therapy gains with Apraxia World, even though caregivers evaluated pronunciation leniently. We also collected a corpus of child speech for offline examination. We will conduct additional analysis once all participants complete the protocol.},
keywords = {Automatic Speech Recognition, Childhood apraxia of speech, Health, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
We previously developed a tablet-based speech therapy game called Apraxia World to address barriers to treatment and increase child motivation during therapy. In this study, we examined pronunciation improvements, child engagement over time, and caregiver evaluation performance while using our game. We recruited ten children to play Apraxia World at home during two four-week treatment blocks, separated by a two-week break; nine of ten have completed the protocol at time of writing. In the treatment blocks, children’s utterances were evaluated either by caregivers or an automated pronunciation framework. Preliminary analysis suggests that children made significant therapy gains with Apraxia World, even though caregivers evaluated pronunciation leniently. We also collected a corpus of child speech for offline examination. We will conduct additional analysis once all participants complete the protocol. |
2019
|
Ding, S.; Zhao, G; Liberatore, C.; Gutierrez-Osuna, R. Learning Structured Sparse Representations for Voice Conversion Journal Article In: IEEE Transactions on Audio, Speech and Language Processing, vol. 28, pp. 343-354, 2019. @article{shaojin-2019-taslp,
title = {Learning Structured Sparse Representations for Voice Conversion},
author = {S. Ding and G Zhao and C. Liberatore and R. Gutierrez-Osuna},
url = {https://ieeexplore.ieee.org/document/8910392
https://psi.engr.tamu.edu/wp-content/uploads/2020/04/shaojin2019taslp.pdf},
doi = {10.1109/TASLP.2019.2955289},
year = {2019},
date = {2019-11-15},
journal = {IEEE Transactions on Audio, Speech and Language Processing},
volume = {28},
pages = {343-354},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {article}
}
|
Ding, S.; Liberatore, C.; Sonsaat, S.; Lučić, I.; Silpachai, A.; Zhao, G; Chukharev-Hudilainen, E.; Levis, J.; Gutierrez-Osuna, R. Golden speaker builder – An interactive tool for pronunciation training Journal Article In: Speech Communication, vol. 115, pp. 51-66, 2019. @article{shaojin-2019-speechcomm,
title = {Golden speaker builder – An interactive tool for pronunciation training},
author = {S. Ding and C. Liberatore and S. Sonsaat and I. Lučić and A. Silpachai and G Zhao and E. Chukharev-Hudilainen and J. Levis and R. Gutierrez-Osuna},
url = {https://www.sciencedirect.com/science/article/pii/S0167639319302675
https://psi.engr.tamu.edu/wp-content/uploads/2019/11/1-s2.0-S0167639319302675-main.pdf
},
year = {2019},
date = {2019-11-14},
journal = {Speech Communication},
volume = {115},
pages = {51-66},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {article}
}
|
Hair, A; Ballard, K J; Ahmed, B; Gutierrez-Osuna, R Evaluating Automatic Speech Recognition for Child Speech Therapy Applications Proceedings Article In: ACM SIGACCESS Conference on Computers and Accessibility, ACM 2019, ISBN: 978-1-4503-6676-2/19/10. @inproceedings{hair2019evaluating,
title = {Evaluating Automatic Speech Recognition for Child Speech Therapy Applications},
author = {A Hair and K J Ballard and B Ahmed and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2019/08/hair2019evaluating.pdf},
doi = {10.1145/3308561.3354606},
isbn = {978-1-4503-6676-2/19/10},
year = {2019},
date = {2019-10-28},
booktitle = {ACM SIGACCESS Conference on Computers and Accessibility},
organization = {ACM},
abstract = {Automatic speech recognition (ASR) technology can be a useful tool in mobile apps for child speech therapy, empowering children to complete their practice with limited caregiver supervision. However, little is known about the feasibility of performing ASR on mobile devices, particularly when training data is limited. In this study, we investigated the performance of two low-resource ASR systems on disordered speech from children. We compared the open-source PocketSphinx (PS) recognizer using adapted acoustic models and a custom template-matching (TM) recognizer. TM and the adapted models significantly out-perform the default PS model. On average, maximum likelihood linear regression and maximum a posteriori adaptation increased PS accuracy from 59.4% to 63.8% and 80.0%, respectively, suggesting that the models successfully captured speaker-specific word production variations. TM reached a mean accuracy of 75.8%. },
keywords = {Automatic Speech Recognition, Childhood apraxia of speech, Health, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
Automatic speech recognition (ASR) technology can be a useful tool in mobile apps for child speech therapy, empowering children to complete their practice with limited caregiver supervision. However, little is known about the feasibility of performing ASR on mobile devices, particularly when training data is limited. In this study, we investigated the performance of two low-resource ASR systems on disordered speech from children. We compared the open-source PocketSphinx (PS) recognizer using adapted acoustic models and a custom template-matching (TM) recognizer. TM and the adapted models significantly out-perform the default PS model. On average, maximum likelihood linear regression and maximum a posteriori adaptation increased PS accuracy from 59.4% to 63.8% and 80.0%, respectively, suggesting that the models successfully captured speaker-specific word production variations. TM reached a mean accuracy of 75.8%. |
Zhao, G; Ding, S.; Gutierrez-Osuna, Ricardo Foreign Accent Conversion by Synthesizing Speech from Phonetic Posteriorgrams Proceedings Article In: Proc. Interspeech, 2019. @inproceedings{guanlong2019-interspeech,
title = {Foreign Accent Conversion by Synthesizing Speech from Phonetic Posteriorgrams},
author = {G Zhao and S. Ding and Ricardo Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2019/07/zhao2019interspeech.pdf},
year = {2019},
date = {2019-09-15},
urldate = {2019-09-15},
booktitle = {Proc. Interspeech},
keywords = {Accent conversion, Deep learning, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Ding, S.; Gutierrez-Osuna, Ricardo Group Latent Embedding for Vector Quantized Variational Autoencoder in Non-Parallel Voice Conversion Proceedings Article In: Proc. Interspeech, 2019. @inproceedings{shaojin2019-interspeech,
title = {Group Latent Embedding for Vector Quantized Variational Autoencoder in Non-Parallel Voice Conversion},
author = {S. Ding and Ricardo Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2019/06/ding2019interspeech.pdf},
doi = {10.21437/Interspeech.2019-1198},
year = {2019},
date = {2019-09-15},
booktitle = {Proc. Interspeech},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Akbar, F.; Mark, G.; Pavlidis, I.; Gutierrez-Osuna, R. An Empirical Study Comparing Unobtrusive Physiological Sensors for Stress Detection in Computer Work Journal Article In: Sensors, vol. 19, 2019. @article{akbar2019sensors,
title = {An Empirical Study Comparing Unobtrusive Physiological Sensors for Stress Detection in Computer Work},
author = {F. Akbar and G. Mark and I. Pavlidis and R. Gutierrez-Osuna},
url = {https://www.mdpi.com/1424-8220/19/17/3766
https://psi.engr.tamu.edu/wp-content/uploads/2020/04/akbar2019sensors.pdf},
year = {2019},
date = {2019-08-30},
journal = {Sensors},
volume = {19},
keywords = {Electrodermal activity, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
Zhao, G; Gutierrez-Osuna, R Using Phonetic Posteriorgram Based Frame Pairing for Segmental Accent Conversion Journal Article In: IEEE/ACM Transactions on Audio, Speech, and Language Processing, vol. 27, no. 10, pp. 1649-1660, 2019, ISSN: 2329-9290. @article{zhao-2019-taslp,
title = {Using Phonetic Posteriorgram Based Frame Pairing for Segmental Accent Conversion},
author = {G Zhao and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2020/04/zhao2019taslp.pdf},
doi = {10.1109/TASLP.2019.2926754},
issn = {2329-9290},
year = {2019},
date = {2019-07-04},
urldate = {2019-07-04},
journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
volume = {27},
number = {10},
pages = {1649-1660},
abstract = {Accent conversion (AC) aims to transform non-native utterances to sound as if the speaker had a native accent. This can be achieved by mapping source speech spectra from a native speaker into the acoustic space of the target non-native speaker. In prior work, we proposed an AC approach that matches frames between the two speakers based on their acoustic similarity after compensating for differences in vocal tract length. In this paper, we propose a new approach that matches frames between the two speakers based on their phonetic (rather than acoustic) similarity. Namely, we map frames from the two speakers into a phonetic posteriorgram using speaker-independent acoustic models trained on native speech. We thoroughly evaluate the approach on a speech corpus containing multiple native and non-native speakers. The proposed algorithm outperforms the prior approach, improving ratings of acoustic quality (22% increase in mean opinion score) and native accent (69% preference) while retaining the voice quality of the non-native speaker. Furthermore, we show that the approach can be used in the reverse conversion direction, i.e., generating speech with a native speaker's voice quality and a non-native accent. Finally, we show that this approach can be applied to non-parallel training data, achieving the same accent conversion performance.},
keywords = {Accent conversion, Deep learning, Speech},
pubstate = {published},
tppubtype = {article}
}
Accent conversion (AC) aims to transform non-native utterances to sound as if the speaker had a native accent. This can be achieved by mapping source speech spectra from a native speaker into the acoustic space of the target non-native speaker. In prior work, we proposed an AC approach that matches frames between the two speakers based on their acoustic similarity after compensating for differences in vocal tract length. In this paper, we propose a new approach that matches frames between the two speakers based on their phonetic (rather than acoustic) similarity. Namely, we map frames from the two speakers into a phonetic posteriorgram using speaker-independent acoustic models trained on native speech. We thoroughly evaluate the approach on a speech corpus containing multiple native and non-native speakers. The proposed algorithm outperforms the prior approach, improving ratings of acoustic quality (22% increase in mean opinion score) and native accent (69% preference) while retaining the voice quality of the non-native speaker. Furthermore, we show that the approach can be used in the reverse conversion direction, i.e., generating speech with a native speaker's voice quality and a non-native accent. Finally, we show that this approach can be applied to non-parallel training data, achieving the same accent conversion performance. |
Monteiro, C. D. D.; Shipman, F. M.; III, S. Duggina; Gutierrez-Osuna, R. Tradeoffs in the Efficient Detection of Sign Language Content in Video Sharing Sites Journal Article In: ACM Transactions on Accessible Computing, vol. 12, no. 2, pp. 1-16, 2019. @article{caio2019asl,
title = {Tradeoffs in the Efficient Detection of Sign Language Content in Video Sharing Sites},
author = {C. D. D. Monteiro and F. M. Shipman and III, S. Duggina and R. Gutierrez-Osuna},
url = {https://dl.acm.org/doi/10.1145/3325863
https://psi.engr.tamu.edu/wp-content/uploads/2020/04/caio2019asl.pdf},
year = {2019},
date = {2019-06-01},
journal = {ACM Transactions on Accessible Computing},
volume = {12},
number = {2},
pages = {1-16},
keywords = {Computer vision, Speech},
pubstate = {published},
tppubtype = {article}
}
|
Huo, Z.; Mortazavi, B. J.; Chaspari, T.; Deutz, N.; Ruebush, L.; Gutierrez-Osuna, R. Predicting the meal macronutrient composition from continuous glucose monitors Proceedings Article In: Proc. IEEE Conf. on Biomedical and Health Informatics, 2019. @inproceedings{huo-2019-bhi,
title = {Predicting the meal macronutrient composition from continuous glucose monitors},
author = {Z. Huo and B. J. Mortazavi and T. Chaspari and N. Deutz and L. Ruebush and R. Gutierrez-Osuna},
year = {2019},
date = {2019-05-19},
booktitle = {Proc. IEEE Conf. on Biomedical and Health Informatics},
keywords = {Chemical sensors, Continuous glucose monitors, Health, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Parnandi, A; Gutierrez-Osuna, R Visual Biofeedback and Game Adaptation in Relaxation Skill Transfer Journal Article In: IEEE Transactions on Affective Computing, vol. 10, no. 2, pp. 276 - 289, 2019. @article{parnandi21017tac,
title = {Visual Biofeedback and Game Adaptation in Relaxation Skill Transfer},
author = {A Parnandi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2019/06/avinash-2019-tac.pdf},
year = {2019},
date = {2019-05-17},
journal = {IEEE Transactions on Affective Computing},
volume = {10},
number = {2},
pages = {276 - 289},
keywords = {Electrodermal activity, Games, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
Akbar, F.; Bayraktaroglu, A. E.; Gao, G.; Grover, T.; Mark, G.; Storer, K.; Silva, D. R. Da Cunha; Gutierrez-Osuna, R.; Wang, Z.; Buddharaju, P.; Jones, N. Cooper; Pavlidis, I.; Wesley, A.; S. Zaman, Email Makes You Sweat: Examining Email Interruptions and Stress with Thermal Imaging Proceedings Article In: Proc. CHI, 2019. @inproceedings{akbar-2019-hci,
title = {Email Makes You Sweat: Examining Email Interruptions and Stress with Thermal Imaging},
author = {F. Akbar and A. E. Bayraktaroglu and G. Gao and T. Grover and G. Mark and K. Storer and D. R. Da Cunha Silva and R. Gutierrez-Osuna and Z. Wang and P. Buddharaju and N. Cooper Jones and I. Pavlidis and A. Wesley and S. Zaman, },
url = {https://psi.engr.tamu.edu/wp-content/uploads/2019/06/paper668.pdf
https://dl.acm.org/citation.cfm?id=3300898},
year = {2019},
date = {2019-05-04},
booktitle = {Proc. CHI},
journal = {Proc. CHI 2019},
keywords = {Electrodermal activity, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
2018
|
Ahmed, B; Monroe, P; Hair, A; Tan, C-T; Gutierrez-Osuna, R; Ballard, K J Speech-driven mobile games for speech therapy: User experiences and feasibility Journal Article In: International Journal of Speech-Language Pathology , vol. 20, no. 6, pp. 644-658, 2018. @article{ahmed2018ijslp,
title = {Speech-driven mobile games for speech therapy: User experiences and feasibility},
author = {B Ahmed and P Monroe and A Hair and C-T Tan and R Gutierrez-Osuna and K J Ballard},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2019/06/ahmed-2018-ijslp.pdf
https://doi.org/10.1080/17549507.2018.1513562},
year = {2018},
date = {2018-10-30},
journal = {International Journal of Speech-Language Pathology },
volume = {20},
number = {6},
pages = {644-658},
keywords = {Childhood apraxia of speech, Games, Health, Speech},
pubstate = {published},
tppubtype = {article}
}
|
Levis, J.; Chukharev-Hudilainen, E.; Gutierrez-Osuna, R.; Lucic, I.; Silpachai, A.; Sonsaat, S. Golden Speaker: Learner Experience with Computer-assisted Pronunciation Practice Proceedings Article In: Proc. Pronunciation in Second Language Learning and Teaching Conference, 2018. @inproceedings{levis2018psslt,
title = {Golden Speaker: Learner Experience with Computer-assisted Pronunciation Practice},
author = {J. Levis and E. Chukharev-Hudilainen and R. Gutierrez-Osuna and I. Lucic and A. Silpachai and S. Sonsaat},
year = {2018},
date = {2018-09-06},
booktitle = {Proc. Pronunciation in Second Language Learning and Teaching Conference},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Ding, S.; Liberatore, C.; Gutierrez-Osuna, R. Learning Structured Dictionaries for Exemplar-based Voice Conversion Proceedings Article In: Proc. Interspeech, 2018. @inproceedings{ding2018interspeech1,
title = {Learning Structured Dictionaries for Exemplar-based Voice Conversion},
author = {S. Ding and C. Liberatore and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/09/ding2018interspeech1.pdf},
doi = {10.21437/Interspeech.2018-1295},
year = {2018},
date = {2018-09-02},
booktitle = {Proc. Interspeech},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Zhao, G; Sonsaat, S; Silpachai, A; Lucic, I; Chukharev-Hudilainen, E; Levis, J; Gutierrez-Osuna, R L2-ARCTIC: A Non-Native English Speech Corpus Proceedings Article In: Proc. Interspeech, 2018. @inproceedings{zhao2018interspeech,
title = {L2-ARCTIC: A Non-Native English Speech Corpus},
author = {G Zhao and S Sonsaat and A Silpachai and I Lucic and E Chukharev-Hudilainen and J Levis and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/08/zhao2018interspeech.pdf
https://psi.engr.tamu.edu/l2-arctic-corpus/},
year = {2018},
date = {2018-09-02},
booktitle = {Proc. Interspeech},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
McKechnie, J.; Ahmed, B.; Gutierrez-Osuna, R.; Monroe, P.; McCabe, P.; Ballard, K. J. Automated speech analysis tools for children’s speech production: A systematic literature review Journal Article In: International Journal of Speech-Language Pathology, vol. 20, no. 6, pp. 583–598, 2018. @article{mcKechnie2018review,
title = {Automated speech analysis tools for children’s speech production: A systematic literature review},
author = {J. McKechnie and B. Ahmed and R. Gutierrez-Osuna and P. Monroe and P. McCabe and K. J. Ballard},
url = {https://doi.org/10.1080/17549507.2018.1477991
https://psi.engr.tamu.edu/wp-content/uploads/2019/06/mckechnie-2018-ijslp.pdf},
year = {2018},
date = {2018-09-02},
journal = {International Journal of Speech-Language Pathology},
volume = {20},
number = {6},
pages = {583–598},
keywords = {Childhood apraxia of speech, Health, Speech},
pubstate = {published},
tppubtype = {article}
}
|
Ding, S.; Zhao, G; Liberatore, C.; Gutierrez-Osuna, R. Improving Sparse Representations in Exemplar-Based Voice Conversion with a Phoneme-Selective Objective Function Proceedings Article In: Proc. Interspeech, 2018. @inproceedings{ding2018interspeech2,
title = {Improving Sparse Representations in Exemplar-Based Voice Conversion with a Phoneme-Selective Objective Function},
author = {S. Ding and G Zhao and C. Liberatore and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/09/ding2018interspeech2.pdf},
doi = {10.21437/Interspeech.2018-1272},
year = {2018},
date = {2018-09-02},
booktitle = {Proc. Interspeech},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Goel, N.; Chaspari, T.; Mortazavi, B. J.; Prioleau, T.; A. Sabharwal,; Gutierrez-Osuna, R. Knowledge-driven dictionaries for sparse representation of continuous glucose monitoring signals Proceedings Article In: Proc. EMBC, 2018. @inproceedings{chaspari2018cgm,
title = {Knowledge-driven dictionaries for sparse representation of continuous glucose monitoring signals},
author = {N. Goel and T. Chaspari and B. J. Mortazavi and T. Prioleau and A. Sabharwal, and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/05/chaspari-2018-embc.pdf},
year = {2018},
date = {2018-07-17},
booktitle = {Proc. EMBC},
volume = {in press},
keywords = {Chemical sensors, Continuous glucose monitors, Health, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Hair, A; Monroe, P; Ahmed, B; Ballard, K J; Gutierrez-Osuna, R Apraxia World: A Speech Therapy Game for Children with Speech Sound Disorders Proceedings Article In: Proceedings of the 2018 Conference on Interaction Design and Children, ACM, 2018, ISBN: 978-1-4503-5152-2/18/06. @inproceedings{hair2018idc,
title = {Apraxia World: A Speech Therapy Game for Children with Speech Sound Disorders},
author = {A Hair and P Monroe and B Ahmed and K J Ballard and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/04/hair2018idc.pdf},
doi = {10.1145/3202185.3202733},
isbn = {978-1-4503-5152-2/18/06},
year = {2018},
date = {2018-06-19},
booktitle = {Proceedings of the 2018 Conference on Interaction Design and Children},
publisher = {ACM},
abstract = {This paper presents Apraxia World, a remote therapy tool for speech sound disorders that integrates speech exercises into an engaging platformer-style game. In Apraxia World, the player controls the avatar with virtual buttons/joystick, whereas speech input is associated with assets needed to advance from one level to the next. We tested performance and child preference of two strategies for delivering speech exercises: during each level, and after it. Most children indicated that doing exercises after completing each level was less disruptive and preferable to doing exercises scattered through the level. We also found that children liked having perceived control over the game (character appearance, exercise behavior). Our results indicate that (i) a familiar style of game successfully engages children, (ii) speech exercises function well when decoupled from game control, and (iii) children are willing to complete required speech exercises while playing a game they enjoy.},
keywords = {Childhood apraxia of speech, Health, Mobile computing, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
This paper presents Apraxia World, a remote therapy tool for speech sound disorders that integrates speech exercises into an engaging platformer-style game. In Apraxia World, the player controls the avatar with virtual buttons/joystick, whereas speech input is associated with assets needed to advance from one level to the next. We tested performance and child preference of two strategies for delivering speech exercises: during each level, and after it. Most children indicated that doing exercises after completing each level was less disruptive and preferable to doing exercises scattered through the level. We also found that children liked having perceived control over the game (character appearance, exercise behavior). Our results indicate that (i) a familiar style of game successfully engages children, (ii) speech exercises function well when decoupled from game control, and (iii) children are willing to complete required speech exercises while playing a game they enjoy. |
Zhao, G; Sonsaat, S; Levis, J; Chukharev-Hudilainen, E; Gutierrez-Osuna, R Accent conversion using phonetic posteriorgrams Proceedings Article In: Proc. ICASSP, 2018. @inproceedings{zhao2018icassp,
title = {Accent conversion using phonetic posteriorgrams},
author = {G Zhao and S Sonsaat and J Levis and E Chukharev-Hudilainen and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/03/zhao2018icassp.pdf
http://people.tamu.edu/~guanlong.zhao/icassp18_demo.html
https://psi.engr.tamu.edu/l2-arctic-corpus/
https://github.com/guanlongzhao/ppg-gmm},
year = {2018},
date = {2018-04-15},
urldate = {2018-04-15},
booktitle = {Proc. ICASSP},
keywords = {Accent conversion, Deep learning, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Liberatore, C; Zhao, G; Gutierrez-Osuna, R Voice Conversion through Residual Warping in a Sparse, Anchor-Based Representation of Speech Proceedings Article In: Proc. ICASSP, 2018. @inproceedings{liberatore2018icassp,
title = {Voice Conversion through Residual Warping in a Sparse, Anchor-Based Representation of Speech},
author = {C Liberatore and G Zhao and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/03/liberatore-icassp2018.pdf},
year = {2018},
date = {2018-04-15},
booktitle = {Proc. ICASSP},
abstract = {In previous work we presented a Sparse, Anchor-Based Representation of speech (SABR) that uses phonemic “anchors” to represent an utterance with a set of sparse non-negative weights. SABR is speaker-independent: combining weights from a source speaker with anchors from a target speaker can be used for voice conversion. Here, we present an extension of the original SABR that significantly improves voice conversion synthesis. Namely, we take the residual signal from the SABR decomposition of the source speaker’s utterance, and warp it to the target speaker’s space using a weighted warping function learned from pairs of source-target
anchors. Using subjective and objective evaluations, we examine the performance of adding the warped residual (SABR+Res) to the original synthesis (SABR). Specifically, listeners rated SABR+Res with an average mean opinion score (MOS) of 3.6, a significant improvement compared to 2.2 MOS for SABR alone (𝑝 < 0.01) and
2.5 MOS for a baseline GMM method (𝑝 < 0.01). In an XAB speaker identity test, listeners correctly identified the identity of SABR+Res (81%) and SABR (84%) as requently as a GMM method (82%) (𝑝 = 0.70, 𝑝 = 0.35). These results indicate that adding the warped residual can dramatically improve synthesis while retaining the
desirable independent qualities of SABR models.},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
In previous work we presented a Sparse, Anchor-Based Representation of speech (SABR) that uses phonemic “anchors” to represent an utterance with a set of sparse non-negative weights. SABR is speaker-independent: combining weights from a source speaker with anchors from a target speaker can be used for voice conversion. Here, we present an extension of the original SABR that significantly improves voice conversion synthesis. Namely, we take the residual signal from the SABR decomposition of the source speaker’s utterance, and warp it to the target speaker’s space using a weighted warping function learned from pairs of source-target
anchors. Using subjective and objective evaluations, we examine the performance of adding the warped residual (SABR+Res) to the original synthesis (SABR). Specifically, listeners rated SABR+Res with an average mean opinion score (MOS) of 3.6, a significant improvement compared to 2.2 MOS for SABR alone (𝑝 < 0.01) and
2.5 MOS for a baseline GMM method (𝑝 < 0.01). In an XAB speaker identity test, listeners correctly identified the identity of SABR+Res (81%) and SABR (84%) as requently as a GMM method (82%) (𝑝 = 0.70, 𝑝 = 0.35). These results indicate that adding the warped residual can dramatically improve synthesis while retaining the
desirable independent qualities of SABR models. |
Angello, G.; Zhao, G.; Manam, A. B.; Gutierrez-Osuna, R. Training Behavior of Successful Tacton-Phoneme Learners Proceedings Article In: IEEE Haptics Symposium, 2018. @inproceedings{genna2018tactons,
title = {Training Behavior of Successful Tacton-Phoneme Learners},
author = {G. Angello and G. Zhao and A. B. Manam and R. Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2022/01/AngelloHaptics2018-2.pdf},
year = {2018},
date = {2018-03-25},
booktitle = {IEEE Haptics Symposium},
keywords = {Other, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Jin, Tiening; Zhou, Juntao; Wang, Zelun; Gutierrez-Osuna, Ricardo; Ahn, Charles; Hwang, Wonjun; Park, Ken; Lin, Pao-Tai Real-time Gas Mixture Analysis Using Mid-infrared Membrane Microcavities Journal Article In: Analytical Chemistry, vol. 90, no. 7, pp. 4348-4353, 2018. @article{jin2018-ac,
title = {Real-time Gas Mixture Analysis Using Mid-infrared Membrane Microcavities},
author = {Tiening Jin and Juntao Zhou and Zelun Wang and Ricardo Gutierrez-Osuna and Charles Ahn and Wonjun Hwang and Ken Park and Pao-Tai Lin },
url = {https://www.ncbi.nlm.nih.gov/pubmed/29509404},
year = {2018},
date = {2018-03-08},
journal = {Analytical Chemistry},
volume = {90},
number = {7},
pages = {4348-4353},
keywords = {Chemical sensors, Infrared spectroscopy},
pubstate = {published},
tppubtype = {article}
}
|
Chaspari, T.; Mortazavi, B.; Prioleau, T.; Sabharwal, A.; Gutierrez-Osuna, R. Sparse representation models of continuous glucose monitoring time-series Proceedings Article In: Proc. 5th International Conference on Wearable and Implantable Body Sensor Networks, 2018. @inproceedings{theodora2018bsn,
title = {Sparse representation models of continuous glucose monitoring time-series},
author = {T. Chaspari and B. Mortazavi and T. Prioleau and A. Sabharwal and R. Gutierrez-Osuna },
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/05/chaspari-2018-bsn.pdf},
year = {2018},
date = {2018-03-04},
booktitle = { Proc. 5th International Conference on Wearable and Implantable Body Sensor Networks},
keywords = {Chemical sensors, Continuous glucose monitors, Health, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Wang, Z; Parnandi, A; Gutierrez-Osuna, R BioPad: Leveraging off-the-Shelf Video Games for Stress Self-Regulation Journal Article In: IEEE Journal of Biomedical and Health Informatics, in press, 2018. @article{wang2018jbhi,
title = {BioPad: Leveraging off-the-Shelf Video Games for Stress Self-Regulation},
author = {Z Wang and A Parnandi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/wang2018jbhi.pdf},
year = {2018},
date = {2018-01-01},
journal = {IEEE Journal of Biomedical and Health Informatics, in press},
keywords = {Electrodermal activity, Games, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
2017
|
Shipman, F; Duggina, S; Monteiro, C; Gutierrez-Osuna, R Speed-Accuracy Tradeoffs for Detecting Sign Language Content in Video Sharing Sites Proceedings Article In: Proceedings of ACM SIGACCESS Conference on Computers and Accessibility (ASSETS 2017), pp. 185-189, 2017. @inproceedings{shipman2017assets,
title = {Speed-Accuracy Tradeoffs for Detecting Sign Language Content in Video Sharing Sites},
author = {F Shipman and S Duggina and C Monteiro and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/shipman2017assets.pdf},
year = {2017},
date = {2017-11-21},
booktitle = {Proceedings of ACM SIGACCESS Conference on Computers and Accessibility (ASSETS 2017)},
pages = {185-189},
keywords = {Computer vision, Gestures, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Hair, A; Gutierrez-Osuna, R Deep Breaths: An Internally- and Externally-Paced Deep Breathing Guide Workshop Proc. 7th International Conference on Affective Computing and Intelligent Interaction Workshops and Demos (ACIIW), 2017. @workshop{hair2017acii,
title = {Deep Breaths: An Internally- and Externally-Paced Deep Breathing Guide},
author = {A Hair and R Gutierrez-Osuna },
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/hair2017acii.pdf},
year = {2017},
date = {2017-10-23},
booktitle = {Proc. 7th International Conference on Affective Computing and Intelligent Interaction Workshops and Demos (ACIIW)},
abstract = {Deep breathing is a simple and intuitive technique for reducing stress, but requires familiarity with breathing exercises and suitable breathing parameters. We present Deep Breaths, a mobile tool that allows users to experiment with various respiratory pacing signals in order to maximize relaxation. Deep Breaths provides a stationary (i.e., clock-based) pacing signal as well as an adaptive pacing signal that follows fluctuations in the user’s heart rate. Deep Breaths also provides real-time visualizations of various standard measures of relaxation. This demonstration aims to illustrate how our system can be used for relaxation training.},
keywords = {Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {workshop}
}
Deep breathing is a simple and intuitive technique for reducing stress, but requires familiarity with breathing exercises and suitable breathing parameters. We present Deep Breaths, a mobile tool that allows users to experiment with various respiratory pacing signals in order to maximize relaxation. Deep Breaths provides a stationary (i.e., clock-based) pacing signal as well as an adaptive pacing signal that follows fluctuations in the user’s heart rate. Deep Breaths also provides real-time visualizations of various standard measures of relaxation. This demonstration aims to illustrate how our system can be used for relaxation training. |
Nguyen, K. N.; Liu, X.; Komogortsevz, O.; Gutierrez-Osuna, R.; Choe, Y. Explanation of the Perceptual Oblique Effect Based on the Fidelity of Oculomotor Control During Saccades Proceedings Article In: 2017 Joint IEEE International Conference on Development and Learning, pp. 15-20, 2017. @inproceedings{saccades-2017-khuong,
title = {Explanation of the Perceptual Oblique Effect Based on the Fidelity of Oculomotor Control During Saccades},
author = {K. N. Nguyen and X. Liu and O. Komogortsevz and R. Gutierrez-Osuna and Y. Choe},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2019/05/08329781-1.pdf},
year = {2017},
date = {2017-09-18},
booktitle = {2017 Joint IEEE International Conference on Development and Learning},
pages = {15-20},
keywords = {Computer vision},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Christy, M; Gupta, A; Grumbach, E; Mandel, L; Furuta, R; Gutierrez-Osuna, R Mass Digitization of Early Modern Texts with Optical Character Recognition Journal Article In: ACM Journal on Computing and Cultural Heritage, vol. in press, 2017. @article{christy2017emop,
title = {Mass Digitization of Early Modern Texts with Optical Character Recognition},
author = {M Christy and A Gupta and E Grumbach and L Mandel and R Furuta and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/christy2017jcch.pdf},
year = {2017},
date = {2017-03-22},
journal = {ACM Journal on Computing and Cultural Heritage},
volume = {in press},
keywords = {OCR},
pubstate = {published},
tppubtype = {article}
}
|
Karkamkar, P; Gutierrez-Osuna, R Optical Computation of Chemometrics Projections using a Digital Micromirror Device Proceedings Article In: Proc. International Symposium on Olfaction and Electronic Nose (ISOEN), 2017. @inproceedings{karkamkar2017isoen,
title = {Optical Computation of Chemometrics Projections using a Digital Micromirror Device},
author = {P Karkamkar and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/purvesh2017isoen.pdf},
year = {2017},
date = {2017-03-15},
booktitle = {Proc. International Symposium on Olfaction and Electronic Nose (ISOEN)},
keywords = {Active sensing, Infrared spectroscopy},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Wang, Z; Gutierrez-Osuna, R Mixture quantification in the presence of unknown interferences Proceedings Article In: Proc. International Symposium on Olfaction and Electronic Nose (ISOEN), 2017. @inproceedings{wang2017isoen,
title = {Mixture quantification in the presence of unknown interferences},
author = {Z Wang and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/wang2017isoen.pdf},
year = {2017},
date = {2017-03-15},
booktitle = {Proc. International Symposium on Olfaction and Electronic Nose (ISOEN)},
journal = {Proc. International Symposium on Olfaction and Electronic Nose (ISOEN)},
keywords = {Active sensing, Chemical sensors, Infrared spectroscopy},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Zhao, G; Gutierrez-Osuna, R Exemplar selection methods in voice conversion Proceedings Article In: Proc. 42nd International Conference on Acoustics, Speech, and Signal Processing (ICASSP), pp. 5525-5529, 2017. @inproceedings{zhao-2017-icassp,
title = {Exemplar selection methods in voice conversion},
author = {G Zhao and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/zhao2017icassp.pdf
http://people.tamu.edu/~guanlong.zhao/spring17/icassp17},
doi = {10.1109/ICASSP.2017.7953213},
year = {2017},
date = {2017-03-05},
booktitle = {Proc. 42nd International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
pages = {5525-5529},
keywords = {Speech, Voice conversion},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Parnandi, A; Gutierrez-Osuna, R Physiological modalities for relaxation skill transfer in biofeedback games Journal Article In: Journal of Biomedical and Health Informatics, vol. in press, 2017. @article{parnandi2017jbhi,
title = {Physiological modalities for relaxation skill transfer in biofeedback games},
author = {A Parnandi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/avinash2017jbhi.pdf},
year = {2017},
date = {2017-03-01},
journal = {Journal of Biomedical and Health Informatics},
volume = {in press},
keywords = {Electrodermal activity, Games, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
2016
|
Monteiro, C; Mathew, C; Shipman, F; Gutierrez-Osuna, R Detecting and Identifying Sign Languages through Visual Features Proceedings Article In: 2016 IEEE International Symposium on Multimedia (ISM), 2016. @inproceedings{monteiro2016ism,
title = {Detecting and Identifying Sign Languages through Visual Features},
author = {C Monteiro and C Mathew and F Shipman and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/monteiro2016ism.pdf},
year = {2016},
date = {2016-12-11},
booktitle = {2016 IEEE International Symposium on Multimedia (ISM)},
keywords = {Computer vision, Gestures, Pattern recognition},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Aryal, S; Gutierrez-Osuna, R Comparing Articulatory and Acoustic Strategies for Reducing Non-Native Accents Proceedings Article In: Proc. Interspeech, 2016. @inproceedings{aryal-2016-interspeech,
title = {Comparing Articulatory and Acoustic Strategies for Reducing Non-Native Accents},
author = {S Aryal and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/aryal2016interspeech.pdf},
year = {2016},
date = {2016-09-08},
booktitle = {Proc. Interspeech},
keywords = {Accent conversion, Articulatory synthesis, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Liberatore, C; Gutierrez-Osuna, R Generating Gestural Scores from Acoustics Through a Sparse Anchor-Based Representation of Speech Proceedings Article In: Proc. Interspeech, 2016. @inproceedings{liberatore2016interspeech,
title = {Generating Gestural Scores from Acoustics Through a Sparse Anchor-Based Representation of Speech},
author = {C Liberatore and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/liberatore2016interspeech.pdf},
year = {2016},
date = {2016-09-08},
booktitle = {Proc. Interspeech},
keywords = {Articulatory synthesis, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Huang, J; Gutierrez-Osuna, R Active wavelength selection for mixture identification with tunable mid-infrared detectors Journal Article In: Analytica Chimica Acta, vol. in press, 2016. @article{huang2016aca,
title = {Active wavelength selection for mixture identification with tunable mid-infrared detectors},
author = {J Huang and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/huang2016aca.pdf},
year = {2016},
date = {2016-08-08},
journal = {Analytica Chimica Acta},
volume = {in press},
keywords = {Active sensing, Chemical sensors, Infrared spectroscopy},
pubstate = {published},
tppubtype = {article}
}
|
Li, J; Gutierrez-Osuna, R; Hodges, R D; Luckey, G; Crowell, J; Schiffman, S S; Nagle, H T Using Field Asymmetric Ion Mobility Spectrometry for Odor Assessment of Automobile Interior Components Journal Article In: IEEE Sensors Journal, vol. in press, 2016. @article{li2016sj,
title = {Using Field Asymmetric Ion Mobility Spectrometry for Odor Assessment of Automobile Interior Components},
author = {J Li and R Gutierrez-Osuna and R D Hodges and G Luckey and J Crowell and S S Schiffman and H T Nagle},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/li2016sj-1.pdf},
year = {2016},
date = {2016-05-01},
journal = {IEEE Sensors Journal},
volume = {in press},
keywords = {Chemical sensors, Electronic nose, Machine olfaction},
pubstate = {published},
tppubtype = {article}
}
|
Shahin, M; Gutierrez-Osuna, R; Ahmed, B Classification of bisyllabic lexical stress patterns in disordered speech using deep learning Proceedings Article In: Proc. International Conference on Acoustics, Speech, and Signal Processing, 2016. @inproceedings{shahin2016icassp,
title = {Classification of bisyllabic lexical stress patterns in disordered speech using deep learning},
author = {M Shahin and R Gutierrez-Osuna and B Ahmed},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/shahin2016icassp.pdf},
year = {2016},
date = {2016-03-20},
booktitle = {Proc. International Conference on Acoustics, Speech, and Signal Processing},
keywords = {Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
McKechnie, J; Ballard, K J; McCabe, P; Murray, E; Lan, T; Gutierrez-Osuna, R; Ahmed, B Influence of type of feedback on effect of tablet-based delivery of intensive speech therapy in children with Childhood Apraxia of Speech Proceedings Article In: Proceedings of the Motor Speech Conference, 2016. @inproceedings{mckechnie-2016-motorspeech,
title = {Influence of type of feedback on effect of tablet-based delivery of intensive speech therapy in children with Childhood Apraxia of Speech},
author = {J McKechnie and K J Ballard and P McCabe and E Murray and T Lan and R Gutierrez-Osuna and B Ahmed},
year = {2016},
date = {2016-03-03},
booktitle = {Proceedings of the Motor Speech Conference},
journal = {Motor Speech Conference},
keywords = {Childhood apraxia of speech, Games, Health, Mobile computing, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Aryal, S; Gutierrez-Osuna, R Data driven articulatory synthesis with deep neural networks Journal Article In: Computer Speech and Language, vol. 36, pp. 260-273, 2016. @article{aryal-2015-cls,
title = {Data driven articulatory synthesis with deep neural networks},
author = {S Aryal and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/aryal2016csl.pdf},
year = {2016},
date = {2016-03-01},
urldate = {2016-03-01},
journal = {Computer Speech and Language},
volume = {36},
pages = {260-273},
keywords = {Accent conversion, Articulatory synthesis, Deep learning, Speech},
pubstate = {published},
tppubtype = {article}
}
|
2015
|
Li, J; Gutierrez-Osuna, R; Hodges, R D; Luckey, G; Crowell, J; Schiffman, S S; Nagle, H T Odor Assessment of Automobile Interior Components Using Ion Mobility Spectrometry Proceedings Article In: IEEE Sensors Conference, 2015. @inproceedings{li2015sensors,
title = {Odor Assessment of Automobile Interior Components Using Ion Mobility Spectrometry},
author = {J Li and R Gutierrez-Osuna and R D Hodges and G Luckey and J Crowell and S S Schiffman and H T Nagle},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/li2015sensors.pdf},
year = {2015},
date = {2015-11-01},
booktitle = {IEEE Sensors Conference},
keywords = {Chemical sensors, Infrared spectroscopy, Olfaction},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Parnandi, A; Karappa, V; Lan, T; Shahin, M; McKechnie, J; Ballard, K; Ahmed, B; Gutierrez-Osuna, R Development of a remote therapy tool for childhood apraxia of speech Journal Article In: ACM Transactions on Accessible Computing, vol. 7, no. 3, pp. 10:1-10:23, 2015. @article{parnandi2015taccess,
title = {Development of a remote therapy tool for childhood apraxia of speech},
author = {A Parnandi and V Karappa and T Lan and M Shahin and J McKechnie and K Ballard and B Ahmed and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/parnandi2015taccess.pdf},
year = {2015},
date = {2015-11-01},
journal = {ACM Transactions on Accessible Computing},
volume = {7},
number = {3},
pages = {10:1-10:23},
keywords = {Childhood apraxia of speech, Games, Health, Mobile computing, Speech},
pubstate = {published},
tppubtype = {article}
}
|
Aryal, S; Gutierrez-Osuna, R Articulatory-based conversion of foreign accents with deep neural networks Proceedings Article In: Proc. Interspeech, pp. 3385-3389, 2015. @inproceedings{aryal2015interspeech,
title = {Articulatory-based conversion of foreign accents with deep neural networks},
author = {S Aryal and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/aryal2015interspeech.pdf},
year = {2015},
date = {2015-09-06},
urldate = {2015-09-06},
booktitle = {Proc. Interspeech},
pages = {3385-3389},
keywords = {Accent conversion, Articulatory synthesis, Deep learning, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Liberatore, C; Aryal, S; Wang, Z; Polsley, S; Gutierrez-Osuna, R SABR: Sparse, Anchor-Based Representation of the Speech Signal Proceedings Article In: Proc. Interspeech 2015, pp. 608-612, 2015. @inproceedings{liberatore2015interspeech,
title = {SABR: Sparse, Anchor-Based Representation of the Speech Signal},
author = {C Liberatore and S Aryal and Z Wang and S Polsley and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/liberatore2015interspeech.pdf},
year = {2015},
date = {2015-09-06},
booktitle = {Proc. Interspeech 2015},
pages = {608-612},
abstract = {We present SABR (Sparse, Anchor-Based Representation), an analysis technique to decompose the speech signal into
speaker-dependent and speaker-independent components. Given a collection of utterances for a particular
speaker, SABR uses the centroid for each phoneme as an acoustic “anchor,” then applies Lasso regularization to
the method on a speaker-independent phoneme recognition task and a voice conversion task. Using a linear classifier,
SABR weights achieve significantly higher phoneme recognition rates than Mel frequency Cepstral coefficients. SABR weights can also be used directly to perform accent conversion without the need to train a speakerto-speaker regression model.},
keywords = {Accent conversion, Articulatory synthesis},
pubstate = {published},
tppubtype = {inproceedings}
}
We present SABR (Sparse, Anchor-Based Representation), an analysis technique to decompose the speech signal into
speaker-dependent and speaker-independent components. Given a collection of utterances for a particular
speaker, SABR uses the centroid for each phoneme as an acoustic “anchor,” then applies Lasso regularization to
the method on a speaker-independent phoneme recognition task and a voice conversion task. Using a linear classifier,
SABR weights achieve significantly higher phoneme recognition rates than Mel frequency Cepstral coefficients. SABR weights can also be used directly to perform accent conversion without the need to train a speakerto-speaker regression model. |
Ahmed, B; Ali, H; Choi, J; Gutierrez-Osuna, R ReBreathe: A calibration protocol that improves stress/relax classification by relabeling deep breathing relaxation exercises Journal Article In: IEEE Transactions on Affective Computing, vol. in press, 2015. @article{ahmed2015taffc,
title = {ReBreathe: A calibration protocol that improves stress/relax classification by relabeling deep breathing relaxation exercises},
author = {B Ahmed and H Ali and J Choi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/ahmed2015taffc.pdf},
year = {2015},
date = {2015-08-01},
journal = {IEEE Transactions on Affective Computing},
volume = {in press},
keywords = {Health, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
Huang, J; Gutierrez-Osuna, R Detection of weak chemicals in strong backgrounds with a tunable infrared sensor Proceedings Article In: International Symposium on Olfaction and Electronic Nose, 2015. @inproceedings{huang2015isoen,
title = {Detection of weak chemicals in strong backgrounds with a tunable infrared sensor},
author = {J Huang and R Gutierrez-Osuna},
year = {2015},
date = {2015-06-28},
booktitle = {International Symposium on Olfaction and Electronic Nose},
keywords = {Active sensing, Chemical sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Nagle, H T; Gutierrez-Osuna, R; Suslick, K S; Persaud, K; Covington, J; Hodges, R D; Luckey, G; Crowell, J; Schiffman, S S Augmenting human odor assessments of cabin air quality of automobiles by instrumental measurements Proceedings Article In: International Symposium on Olfaction and Electronic Nose, 2015. @inproceedings{nagle2015isoen,
title = {Augmenting human odor assessments of cabin air quality of automobiles by instrumental measurements},
author = {H T Nagle and R Gutierrez-Osuna and K S Suslick and K Persaud and J Covington and R D Hodges and G Luckey and J Crowell and S S Schiffman},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/nagle2015isoen.pdf},
year = {2015},
date = {2015-06-28},
booktitle = {International Symposium on Olfaction and Electronic Nose},
keywords = {Chemical sensors, Machine olfaction},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Bhandari, R; Parnandi, A; Shipp, E; Ahmed, B; Gutierrez-Osuna, R Music-based respiratory biofeedback in visually-demanding tasks Proceedings Article In: 15th International Conference on New Interfaces for Musical Expression (NIME), 2015. @inproceedings{Bhandari2015nime,
title = {Music-based respiratory biofeedback in visually-demanding tasks},
author = {R Bhandari and A Parnandi and E Shipp and B Ahmed and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/Bhandari2015nime.pdf},
year = {2015},
date = {2015-05-31},
urldate = {2015-05-31},
booktitle = {15th International Conference on New Interfaces for Musical Expression (NIME)},
keywords = {Electrodermal activity, Games, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Liberatore, C; Gutierrez-Osuna, R Joint Optimization of Anatomical and Gestural Parameters in a Physical Vocal Tract Model Proceedings Article In: ICASSP, IEEE 2015. @inproceedings{liberatore2015icassp,
title = {Joint Optimization of Anatomical and Gestural Parameters in a Physical Vocal Tract Model},
author = {C Liberatore and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/liberatore2015icassp.pdf},
year = {2015},
date = {2015-04-19},
booktitle = {ICASSP},
organization = {IEEE},
keywords = {Accent conversion, Articulatory inversion, Articulatory synthesis},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Shahin, M; Ahmed, B; Parnandi, A; Karappa, V; McKechnie, J; Ballard, K; Gutierrez-Osuna, R Tabby Talks: an automated tool for the assessment of childhood apraxia of speech Journal Article In: Speech Communication, vol. in press, 2015. @article{shahin2015specom,
title = {Tabby Talks: an automated tool for the assessment of childhood apraxia of speech},
author = {M Shahin and B Ahmed and A Parnandi and V Karappa and J McKechnie and K Ballard and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/shahin2015specom.pdf},
year = {2015},
date = {2015-04-02},
urldate = {2015-04-02},
journal = {Speech Communication},
volume = {in press},
keywords = {Childhood apraxia of speech, Games, Health, Mobile computing, Speech},
pubstate = {published},
tppubtype = {article}
}
|
Shipman, F; Gutierrez-Osuna, R; Shipman, T; Monteiro, C; Karappa, V Towards a Distributed Digital Library for Sign Language Content Proceedings Article In: Proc. ACM/IEEE Joint Conference on Digital Libraries, 2015. @inproceedings{shipman2015jcdl,
title = {Towards a Distributed Digital Library for Sign Language Content},
author = {F Shipman and R Gutierrez-Osuna and T Shipman and C Monteiro and V Karappa},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/shipman2015jcdl.pdf},
year = {2015},
date = {2015-04-02},
booktitle = {Proc. ACM/IEEE Joint Conference on Digital Libraries},
volume = {in press},
keywords = {Computer vision, Gestures, Pattern recognition},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Gupta, A; Gutierrez-Osuna, R; Christy, M; Capitanu, B; Auvil, L; Grumbach, L; Furuta, R; Mandell, L Automatic assessment of OCR quality in historical documents Proceedings Article In: Proc. AAAI, 2015. @inproceedings{gupta2015aaai,
title = {Automatic assessment of OCR quality in historical documents},
author = {A Gupta and R Gutierrez-Osuna and M Christy and B Capitanu and L Auvil and L Grumbach and R Furuta and L Mandell},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gupta2015aaai.pdf},
year = {2015},
date = {2015-01-25},
booktitle = {Proc. AAAI},
volume = {in press},
keywords = {OCR, Other, Pattern recognition},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Aryal, S; Gutierrez-Osuna, R Reduction of non-native accents through statistical parametric articulatory synthesis Journal Article In: Journal of the Acoustical Society of America, vol. 137, no. 1, pp. 433-446, 2015. @article{aryal2015jasa,
title = {Reduction of non-native accents through statistical parametric articulatory synthesis},
author = {S Aryal and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/aryal2015jasa.pdf},
year = {2015},
date = {2015-01-23},
journal = {Journal of the Acoustical Society of America},
volume = {137},
number = {1},
pages = {433-446},
keywords = {Accent conversion, Articulatory synthesis, Speech},
pubstate = {published},
tppubtype = {article}
}
|
Wang, Z; Wang, J; Zhang, S; Gong, Y Visual Tracking based on Online Sparse Feature Learning Journal Article In: Image and Vision Computing, vol. 38, no. 24--32, 2015. @article{wang2015visual,
title = {Visual Tracking based on Online Sparse Feature Learning},
author = {Z Wang and J Wang and S Zhang and Y Gong},
editor = {Elsevier},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/wang2015visual.pdf},
year = {2015},
date = {2015-01-01},
journal = {Image and Vision Computing},
volume = {38},
number = {24--32},
abstract = {Various visual tracking approaches have been proposed for robust target tracking, among which using sparse representation of the tracking target yields promising performance. Some earlier works in this line used a fixed subset of features to compress the target's appearance, which has limited modeling capacity between the target and the background, and could not accommodate their appearance change over long period of time. In this paper, we propose a visual tracking method by modeling targets with online-learned sparse features. We first extract high dimensional Haar-like features as an over-completed basis set, and then solve the feature selection problem in an efficient L1-regularized sparse-coding process. The selected low-dimensional representation best discriminates the target from its neighboring background. Next we use a naive Bayesian classifier to select the most-likely target candidate by a binary classification process. The online feature selection process happens when there are significant appearance changes identified by a thresholding strategy. In this way, our proposed method could work for long tracking tasks. At the same time, our comprehensive experimental evaluation has shown that the proposed methods achieve excellent running speed and higher accuracy over many state-of-the-art approaches.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Various visual tracking approaches have been proposed for robust target tracking, among which using sparse representation of the tracking target yields promising performance. Some earlier works in this line used a fixed subset of features to compress the target's appearance, which has limited modeling capacity between the target and the background, and could not accommodate their appearance change over long period of time. In this paper, we propose a visual tracking method by modeling targets with online-learned sparse features. We first extract high dimensional Haar-like features as an over-completed basis set, and then solve the feature selection problem in an efficient L1-regularized sparse-coding process. The selected low-dimensional representation best discriminates the target from its neighboring background. Next we use a naive Bayesian classifier to select the most-likely target candidate by a binary classification process. The online feature selection process happens when there are significant appearance changes identified by a thresholding strategy. In this way, our proposed method could work for long tracking tasks. At the same time, our comprehensive experimental evaluation has shown that the proposed methods achieve excellent running speed and higher accuracy over many state-of-the-art approaches. |
Huang, J; Gutierrez-Osuna, R Active wavelength selection for mixture analysis with tunable infrared detectors Journal Article In: Sensors and Actuators B: Chemical, vol. 208, pp. 245–257, 2015. @article{huang2014sab,
title = {Active wavelength selection for mixture analysis with tunable infrared detectors},
author = {J Huang and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/huang2014sab.pdf},
year = {2015},
date = {2015-01-01},
journal = {Sensors and Actuators B: Chemical},
volume = {208},
pages = {245–257},
keywords = {Active sensing, Chemical sensors, Infrared spectroscopy},
pubstate = {published},
tppubtype = {article}
}
|
2014
|
Li, J; Hodges, R D; Gutierrez-Osuna, R; Luckey, G; Crowell, J; Schiffman, S S; Nagle, H T Odor Assessment of Automobile Cabin Air by Machine Olfaction Proceedings Article In: Proc. IEEE Sensors Conference, 2014. @inproceedings{li2004sensorsconf,
title = {Odor Assessment of Automobile Cabin Air by Machine Olfaction},
author = {J Li and R D Hodges and R Gutierrez-Osuna and G Luckey and J Crowell and S S Schiffman and H T Nagle},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/li2004sensorsconf.pdf},
year = {2014},
date = {2014-11-02},
booktitle = {Proc. IEEE Sensors Conference},
keywords = {Chemical sensors, Electronic nose, Olfaction},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Lan, T; Aryal, S; Ahmed, B; Ballard, K; Gutierrez-Osuna, R Flappy Voice: An Interactive Game for Childhood Apraxia of Speech Therapy Proceedings Article In: Proc. CHI-PLAY, 2014. @inproceedings{lan2014chiplay,
title = {Flappy Voice: An Interactive Game for Childhood Apraxia of Speech Therapy},
author = {T Lan and S Aryal and B Ahmed and K Ballard and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/lan2014chiplay.pdf},
year = {2014},
date = {2014-10-19},
booktitle = {Proc. CHI-PLAY},
keywords = {Childhood apraxia of speech, Games, Health, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Al-Rihawi, R; Ahmed, B; Gutierrez-Osuna, R Dodging Stress With A Personalized Biofeedback Game Proceedings Article In: Proc. CHI-PLAY, 2014. @inproceedings{rami2014chiplay,
title = {Dodging Stress With A Personalized Biofeedback Game},
author = {R Al-Rihawi and B Ahmed and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/rami2014chiplay.pdf},
year = {2014},
date = {2014-10-19},
booktitle = {Proc. CHI-PLAY},
keywords = {Electrodermal activity, Games, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Shahin, M; Ahmed, B; McKechnie, J; Ballard, K; Gutierrez-Osuna, R A comparison of GMM-HMM and DNN-HMM based pronunciation verification techniques for use in the assessment of childhood apraxia of speech Proceedings Article In: Proc. Interspeech, 2014. @inproceedings{mostafa2014interspeech,
title = {A comparison of GMM-HMM and DNN-HMM based pronunciation verification techniques for use in the assessment of childhood apraxia of speech},
author = {M Shahin and B Ahmed and J McKechnie and K Ballard and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/mostafa2014interspeech.pdf},
year = {2014},
date = {2014-09-14},
booktitle = {Proc. Interspeech},
keywords = {Childhood apraxia of speech, Health, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Christy, M; Auvil, L; Gutierrez-Osuna, R; Capitanu, B; Gupta, A; Grumbach, E Diagnosing Page Image Problems with Post-OCR Triage for eMOP Proceedings Article In: Proc. Digital Humanities Conference, 2014. @inproceedings{christy2014emopdhc,
title = {Diagnosing Page Image Problems with Post-OCR Triage for eMOP},
author = {M Christy and L Auvil and R Gutierrez-Osuna and B Capitanu and A Gupta and E Grumbach},
year = {2014},
date = {2014-07-08},
booktitle = {Proc. Digital Humanities Conference},
volume = {in press},
keywords = {OCR, Other, Pattern recognition},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Avnet, M S; Phillips, D; Bhattacharya, R; Gutierrez-Osuna, R; Malak, R; Mayer, R; Ntaimo, L; Quadrifoglio, L; Tsvetkov, P Toward an Interdisciplinary Program in Systems Engineering at Texas A&M University Proceedings Article In: Proc. 4th International Engineering Systems Symposium (CESUN 2014), 2014. @inproceedings{avnet2014systemsEngr,
title = {Toward an Interdisciplinary Program in Systems Engineering at Texas A&M University},
author = {M S Avnet and D Phillips and R Bhattacharya and R Gutierrez-Osuna and R Malak and R Mayer and L Ntaimo and L Quadrifoglio and P Tsvetkov},
year = {2014},
date = {2014-06-08},
booktitle = {Proc. 4th International Engineering Systems Symposium (CESUN 2014)},
keywords = {Other},
pubstate = {published},
tppubtype = {inproceedings}
}
|
McKechnie, J; Ballard, K; McCabe, P; Gutierrez-Osuna, R; Karappa, V; Parnandi, A; Shahin, M; Murray, E; Ahmed, B Tablet-based delivery of intensive speech therapy in children with Childhood Apraxia of Speech - Pilot Phase Proceedings Article In: Speech Pathology Australia National Conference, 2014. @inproceedings{jacqui2013australiaSLPconference,
title = {Tablet-based delivery of intensive speech therapy in children with Childhood Apraxia of Speech - Pilot Phase},
author = {J McKechnie and K Ballard and P McCabe and R Gutierrez-Osuna and V Karappa and A Parnandi and M Shahin and E Murray and B Ahmed},
year = {2014},
date = {2014-05-14},
urldate = {2014-05-14},
booktitle = {Speech Pathology Australia National Conference},
keywords = {Games, Health, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Karappa, V; Monteiro, C; Shipman, F; Gutierrez-Osuna, R Detection of sign-language content in video through polar motion profiles Proceedings Article In: Proc. 39th International Conference on Acoustics, Speech, and Signal Processing (ICASSP), pp. 1299-1303, 2014. @inproceedings{virendraasl2014icassp,
title = {Detection of sign-language content in video through polar motion profiles},
author = {V Karappa and C Monteiro and F Shipman and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/virendraasl2014icassp.pdf},
year = {2014},
date = {2014-05-09},
booktitle = {Proc. 39th International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
pages = {1299-1303},
keywords = {Computer vision, Gestures},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Aryal, S; Gutierrez-Osuna, R Accent conversion through cross-speaker articulatory synthesis Proceedings Article In: Proc. 39th International Conference on Acoustics, Speech, and Signal Processing (ICASSP), pp. 7744-7748, 2014. @inproceedings{sandesh2014icassp,
title = {Accent conversion through cross-speaker articulatory synthesis},
author = {S Aryal and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/sandesh2014icassp.pdf},
year = {2014},
date = {2014-05-09},
booktitle = {Proc. 39th International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
pages = {7744-7748},
keywords = {Accent conversion, Articulatory synthesis, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Aryal, S; Gutierrez-Osuna, R Can voice conversion be used to reduce non-native accents Proceedings Article In: Proc. 39th International Conference on Acoustics, Speech, and Signal Processing (ICASSP), pp. 7929-7933, 2014. @inproceedings{sandeshaccentconversion2014icassp,
title = {Can voice conversion be used to reduce non-native accents},
author = {S Aryal and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/sandeshaccentconversion2014icassp.pdf},
year = {2014},
date = {2014-05-09},
booktitle = {Proc. 39th International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
pages = {7929-7933},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Felps, D; Aryal, S; Gutierrez-Osuna, R Normalization of articulatory data through Procrustes transformations and analysis-by-synthesis Proceedings Article In: Proc. 39th International Conference on Acoustics, Speech, and Signal Processing (ICASSP), pp. 3051-3055, 2014. @inproceedings{danielprocrustes2014icassp,
title = {Normalization of articulatory data through Procrustes transformations and analysis-by-synthesis},
author = {D Felps and S Aryal and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/danielprocrustes2014icassp.pdf},
year = {2014},
date = {2014-05-09},
booktitle = {Proc. 39th International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
pages = {3051-3055},
keywords = {Accent conversion, Articulatory synthesis, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Parnandi, A; Gutierrez-Osuna, R A Comparative Study of Game Mechanics and Control Laws for an Adaptive Physiological Game Journal Article In: Journal on Multimodal User Interfaces, 2014. @article{avinash2014jmui,
title = {A Comparative Study of Game Mechanics and Control Laws for an Adaptive Physiological Game},
author = {A Parnandi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/avinash2014jmui.pdf},
year = {2014},
date = {2014-04-29},
journal = {Journal on Multimodal User Interfaces},
keywords = {Electrodermal activity, Games, Health, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
|
Harris, J; Vance, S; Fernandes, O; Parnandi, A; Gutierrez-Osuna, R Sonic Respiration: Controlling Respiration Rate Through Auditory Biofeedback Proceedings Article In: Proc. ACM CHI Conference on Human Factors in Computing Systems (CHI 2014) Works-in-Progress, 2014. @inproceedings{harris2014chi,
title = {Sonic Respiration: Controlling Respiration Rate Through Auditory Biofeedback},
author = {J Harris and S Vance and O Fernandes and A Parnandi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/harris2014chi.pdf},
year = {2014},
date = {2014-04-26},
urldate = {2014-04-26},
booktitle = {Proc. ACM CHI Conference on Human Factors in Computing Systems (CHI 2014) Works-in-Progress},
volume = {in press},
keywords = {Games, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Perera-Lluna, A; Manivannan, K; Xu, P; Gutierrez-Osuna, R; Benner, C; Russell, B D Automatic Capacitor Bank Identification in Power Distribution Systems Journal Article In: Electric Power Systems Research, vol. in press, 2014. @article{alex2014epsr,
title = {Automatic Capacitor Bank Identification in Power Distribution Systems},
author = {A Perera-Lluna and K Manivannan and P Xu and R Gutierrez-Osuna and C Benner and B D Russell},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/alex2014epsr.pdf},
year = {2014},
date = {2014-02-06},
journal = {Electric Power Systems Research},
volume = {in press},
keywords = {Other, Pattern recognition},
pubstate = {published},
tppubtype = {article}
}
|
Yu, Y; Choe, Y; Gutierrez-Osuna, R Context-sensitive Intra-class Clustering Journal Article In: Pattern Recognition Letters, vol. 37, pp. 85-93, 2014. @article{yingwei2013prl,
title = {Context-sensitive Intra-class Clustering},
author = {Y Yu and Y Choe and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/yingwei2013prl.pdf},
year = {2014},
date = {2014-02-01},
journal = {Pattern Recognition Letters},
volume = {37},
pages = {85-93},
keywords = {Pattern recognition},
pubstate = {published},
tppubtype = {article}
}
|
Gosangi, R; Gutierrez-Osuna, R Active classification with arrays of tunable chemical sensors Journal Article In: Chemometrics and Intelligent Laboratory Systems, vol. 132, pp. 91-102, 2014. @article{rakesh2014cils,
title = {Active classification with arrays of tunable chemical sensors},
author = {R Gosangi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/rakesh2014cils.pdf},
year = {2014},
date = {2014-02-01},
journal = {Chemometrics and Intelligent Laboratory Systems},
volume = {132},
pages = {91-102},
keywords = {Active sensing, Metal-oxide sensors},
pubstate = {published},
tppubtype = {article}
}
|
2013
|
Parnandi, A; Ahmed, B; Shipp, E; Gutierrez-Osuna, R Chill-Out: Relaxation training through respiratory biofeedback in a mobile casual game Conference Fifth International Conference on Mobile Computing, Applications and Services (MobiCASE 2013), 2013. @conference{avimobicase2013,
title = {Chill-Out: Relaxation training through respiratory biofeedback in a mobile casual game},
author = {A Parnandi and B Ahmed and E Shipp and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/avimobicase2013.pdf},
year = {2013},
date = {2013-11-07},
booktitle = {Fifth International Conference on Mobile Computing, Applications and Services (MobiCASE 2013)},
keywords = {Electrodermal activity, Games, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {conference}
}
|
Shipman, F; Gutierrez-Osuna, R; Monteiro, C Identifying Sign Language Videos in Video Sharing Sites Journal Article In: ACM Transactions on Accessible Computing, vol. in press, 2013. @article{Shipman2013,
title = {Identifying Sign Language Videos in Video Sharing Sites},
author = {F Shipman and R Gutierrez-Osuna and C Monteiro},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/Shipman2013.pdf},
year = {2013},
date = {2013-11-04},
journal = {ACM Transactions on Accessible Computing},
volume = {in press},
keywords = {Computer vision, Gestures},
pubstate = {published},
tppubtype = {article}
}
|
Parnandi, A; Karappa, V; Son, Y; Shahin, M; McKechnie, J; Ballard, K; Ahmed, B; Gutierrez-Osuna, R Architecture of an automated therapy tool for childhood apraxia of speech Conference The 15th International ACM SIGACCESS Conference on Computers and Accessibility (ASSETS), 2013. @conference{avinashassets2013,
title = {Architecture of an automated therapy tool for childhood apraxia of speech},
author = {A Parnandi and V Karappa and Y Son and M Shahin and J McKechnie and K Ballard and B Ahmed and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/avinashassets2013.pdf},
year = {2013},
date = {2013-10-21},
urldate = {2013-10-21},
booktitle = {The 15th International ACM SIGACCESS Conference on Computers and Accessibility (ASSETS)},
keywords = {Childhood apraxia of speech, Games, Health, Mobile computing, Speech},
pubstate = {published},
tppubtype = {conference}
}
|
Parnandi, A; Son, Y; Gutierrez-Osuna, R A Control-Theoretic Approach to Adaptive Physiological Games Conference Humaine Association Conference on Affective Computing and Intelligent Interaction (ACII), 2013. @conference{avigameacii,
title = {A Control-Theoretic Approach to Adaptive Physiological Games},
author = {A Parnandi and Y Son and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/avigameacii.pdf},
year = {2013},
date = {2013-09-02},
booktitle = {Humaine Association Conference on Affective Computing and Intelligent Interaction (ACII)},
keywords = {Electrodermal activity, Games, Health, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {conference}
}
|
Parnandi, A; Gutierrez-Osuna, R Contactless Measurement of Heart Rate Variability from Fluctuations in Pupillary Dilation Conference Humaine Association Conference on Affective Computing and Intelligent Interaction (ACII), 2013. @conference{avipupilacii,
title = {Contactless Measurement of Heart Rate Variability from Fluctuations in Pupillary Dilation},
author = {A Parnandi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/avipupilacii.pdf},
year = {2013},
date = {2013-09-02},
booktitle = {Humaine Association Conference on Affective Computing and Intelligent Interaction (ACII)},
keywords = {Contactless sensing, Health, Heart rate variability, Stress},
pubstate = {published},
tppubtype = {conference}
}
|
Aryal, S; Felps, D; Gutierrez-Osuna, R Foreign Accent Conversion through Voice Morphing Proceedings Article In: Interspeech, pp. 3077-3081, 2013. @inproceedings{aryal2013interspeech,
title = {Foreign Accent Conversion through Voice Morphing},
author = {S Aryal and D Felps and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/aryal2013interspeech.pdf},
year = {2013},
date = {2013-08-25},
booktitle = {Interspeech},
pages = {3077-3081},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Khan, H; Ahmed, B; Choi, J; Gutierrez-Osuna, R Using an Ambulatory Stress Monitoring Device to Identify Relaxation Due to Untrained Deep Breathing Conference 35th Annual International Conference of the IEEE Engineering in Medicine & Biology Society, 2013. @conference{hira2013,
title = {Using an Ambulatory Stress Monitoring Device to Identify Relaxation Due to Untrained Deep Breathing},
author = {H Khan and B Ahmed and J Choi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/hira2013.pdf},
year = {2013},
date = {2013-07-03},
booktitle = {35th Annual International Conference of the IEEE Engineering in Medicine & Biology Society},
pages = {n/a},
abstract = {We have developed a non-invasive stress monitoring device to analyze the physiological changes in a person while undergoing different tasks. Our main aim was to use the developed monitoring device to identify the efficacy of deep breathing as a relaxing activity in comparison to mentally stressful activities. A protocol with different mentally stressful activities intervened with regular sessions of deep breathing was designed. Participants were asked to perform the set of tasks in a lab setup. The data from three parameters i.e. heart rate, respiration and skin conductance was captured by the physiological sensors and was then analyzed. We found some very interesting results that subjects were not able to breathe properly and thus their stress level was high during the deep breathing exercise. Our results also validate the use of our device to accurately identify if the subjects were able to properly control their breathing to allow them to relax.},
keywords = {Stress, Wearable sensors},
pubstate = {published},
tppubtype = {conference}
}
We have developed a non-invasive stress monitoring device to analyze the physiological changes in a person while undergoing different tasks. Our main aim was to use the developed monitoring device to identify the efficacy of deep breathing as a relaxing activity in comparison to mentally stressful activities. A protocol with different mentally stressful activities intervened with regular sessions of deep breathing was designed. Participants were asked to perform the set of tasks in a lab setup. The data from three parameters i.e. heart rate, respiration and skin conductance was captured by the physiological sensors and was then analyzed. We found some very interesting results that subjects were not able to breathe properly and thus their stress level was high during the deep breathing exercise. Our results also validate the use of our device to accurately identify if the subjects were able to properly control their breathing to allow them to relax. |
Gosangi, R; Gutierrez-Osuna, R Active temperature modulation of metal-oxide sensors for quantitative analysis of gas mixtures Journal Article In: Sensors and Actuators B: Chemical, vol. 185, pp. 201-210, 2013. @article{rakeshmixturessab13,
title = {Active temperature modulation of metal-oxide sensors for quantitative analysis of gas mixtures},
author = {R Gosangi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/rakeshmixturessab13.pdf},
year = {2013},
date = {2013-04-15},
journal = {Sensors and Actuators B: Chemical},
volume = {185},
pages = {201-210},
keywords = {Active sensing, Chemical sensors, Metal-oxide sensors},
pubstate = {published},
tppubtype = {article}
}
|
Aryal, S; Gutierrez-Osuna, R Articulatory inversion and synthesis: towards articulatory-based modification of speech Proceedings Article In: 38th International Conference on Acoustics, Speech, and Signal Processing (ICASSP), pp. 7952-7956, 2013. @inproceedings{aryal2013icassp,
title = {Articulatory inversion and synthesis: towards articulatory-based modification of speech},
author = {S Aryal and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/aryal2013icassp.pdf},
year = {2013},
date = {2013-02-28},
booktitle = {38th International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
pages = {7952-7956},
keywords = {Articulatory inversion, Articulatory synthesis, Speech},
pubstate = {published},
tppubtype = {inproceedings}
}
|
Huang, J; Gutierrez-Osuna, R Active analysis of chemical mixtures with multi-modal sparse non-negative least squares Conference 38th International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2013. @conference{jinicassp2013,
title = {Active analysis of chemical mixtures with multi-modal sparse non-negative least squares},
author = {J Huang and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/jinicassp2013.pdf},
year = {2013},
date = {2013-02-28},
booktitle = {38th International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
keywords = {Active sensing, Chemical sensors, Infrared spectroscopy},
pubstate = {published},
tppubtype = {conference}
}
|
Lee, J; Gutierrez-Osuna, R; Young, S SILK: Scale-space integrated Lucas-Kanade image registration for super-resolution from video Conference 38th International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2013. @conference{josephicassp2013,
title = {SILK: Scale-space integrated Lucas-Kanade image registration for super-resolution from video},
author = {J Lee and R Gutierrez-Osuna and S Young},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/josephicassp2013.pdf},
year = {2013},
date = {2013-02-28},
booktitle = {38th International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
keywords = {Computer vision},
pubstate = {published},
tppubtype = {conference}
}
|
2012
|
Gosangi, R; Gutierrez-Osuna, R Active Decomposition and Sensing in Networks of Distributed Chemical Sensors Technical Report 2012. @techreport{gosangi2012techreport,
title = {Active Decomposition and Sensing in Networks of Distributed Chemical Sensors},
author = {R Gosangi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gosangi2012techreport.pdf},
year = {2012},
date = {2012-12-05},
abstract = {Active sensing enables a sensor to optimize its tunings on-the-fly based on information obtained from previous measurements. When applied to networks of distributed sensors, however, active sensing becomes computationally impractical due to the combinatorial number of sensing configurations. To address this problem, we present an active decomposition and sensing (ADS) method that combines the advantages of classifier decomposition with those of active sensing. Namely, we use class posteriors to decompose the problem across the sensors in the network. Each sensor then applies active sensing to select the next tuning to solve its specific subproblem. As a result, the method scales linearly (rather than combinatorially) with the number of sensors. We validate ADS on a database of infrared absorption spectroscopy containing 50 chemicals. Our results show that active decomposition improves classification performance and reduces sensing costs when compared to using active sensing only at the node level.},
keywords = {Active sensing, Chemical sensors},
pubstate = {published},
tppubtype = {techreport}
}
Active sensing enables a sensor to optimize its tunings on-the-fly based on information obtained from previous measurements. When applied to networks of distributed sensors, however, active sensing becomes computationally impractical due to the combinatorial number of sensing configurations. To address this problem, we present an active decomposition and sensing (ADS) method that combines the advantages of classifier decomposition with those of active sensing. Namely, we use class posteriors to decompose the problem across the sensors in the network. Each sensor then applies active sensing to select the next tuning to solve its specific subproblem. As a result, the method scales linearly (rather than combinatorially) with the number of sensors. We validate ADS on a database of infrared absorption spectroscopy containing 50 chemicals. Our results show that active decomposition improves classification performance and reduces sensing costs when compared to using active sensing only at the node level. |
Huang, J; Gutierrez-Osuna, R Active Analysis of Chemical Mixtures with Multi-modal Sparse Non-negative Least Sqares Technical Report 2012. @techreport{huang2012techreport,
title = {Active Analysis of Chemical Mixtures with Multi-modal Sparse Non-negative Least Sqares},
author = {J Huang and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/huang2012techreport.pdf},
year = {2012},
date = {2012-12-05},
abstract = {New sensor technologies such as Fabry-Pérot interferometers (FPI) offer low-cost and portable alternatives to traditional infrared absorption spectroscopy for chemical analysis. However, with FPIs the absorption spectrum has to be measured one wavelength at a time. In this work, we propose an active-sensing framework to select a subset of wavelengths that best separates the specific components of a chemical mixture. Compared to passive feature-selection approaches, in which the subset is elected offline, active sensing selects the next feature on-the-fly based on previous measurements so as to reduce uncertainty. We propose a novel multi-modal non-negative least squares method (MM-NNLS) to solve the underlying linear system, which has multiple near-optimal solutions. We tested the framework on mixture problems of up to 10 components from a library of 100 chemicals. MM-NNLS can solve complex mixtures using only a small number of measurements, and outperforms passive approaches in terms of sensing efficiency and stability},
keywords = {Active sensing, Chemical sensors, Infrared spectroscopy},
pubstate = {published},
tppubtype = {techreport}
}
New sensor technologies such as Fabry-Pérot interferometers (FPI) offer low-cost and portable alternatives to traditional infrared absorption spectroscopy for chemical analysis. However, with FPIs the absorption spectrum has to be measured one wavelength at a time. In this work, we propose an active-sensing framework to select a subset of wavelengths that best separates the specific components of a chemical mixture. Compared to passive feature-selection approaches, in which the subset is elected offline, active sensing selects the next feature on-the-fly based on previous measurements so as to reduce uncertainty. We propose a novel multi-modal non-negative least squares method (MM-NNLS) to solve the underlying linear system, which has multiple near-optimal solutions. We tested the framework on mixture problems of up to 10 components from a library of 100 chemicals. MM-NNLS can solve complex mixtures using only a small number of measurements, and outperforms passive approaches in terms of sensing efficiency and stability |
Parnandi, A; Gutierrez-Osuna, R Contactless Measurement of Heart Rate Variability from Pupillary Fluctuations Technical Report 2012. @techreport{parnandi2012techreport,
title = {Contactless Measurement of Heart Rate Variability from Pupillary Fluctuations},
author = {A Parnandi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/parnandi2012techreport.pdf},
year = {2012},
date = {2012-12-04},
abstract = {The ability to measure a person’s physiological parameters in a contactless fashion without attaching electrodes to the skin has tremendous potential in making healthcare delivery more efficient. In this paper, we present a proof-of-concept method for measuring one such vital parameter, heart rate variability (HRV), in a contactless fashion from the spontaneous pupillary fluctuations. Pupillary measurements are done using a remote eye tracker for imaging and an integro-differential algorithm for the segmentation of the pupil-iris boundary. We estimate HRV from energy distribution in the low frequency (LF) (0.04 to 0.15 Hz) and high frequency (HF) (0.15 to 0.4 Hz) bands of the power spectrum of the pupillary fluctuations. In our study, we noted statistically significant correlation between the estimated HRV and the ground truth measures under a range of breathing conditions and under different illumination levels. The high degree of agreement evident in our results suggests that pupillary fluctuations obtained in a contactless fashion can be a reliable indicator of HRV.},
keywords = {Contactless sensing, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {techreport}
}
The ability to measure a person’s physiological parameters in a contactless fashion without attaching electrodes to the skin has tremendous potential in making healthcare delivery more efficient. In this paper, we present a proof-of-concept method for measuring one such vital parameter, heart rate variability (HRV), in a contactless fashion from the spontaneous pupillary fluctuations. Pupillary measurements are done using a remote eye tracker for imaging and an integro-differential algorithm for the segmentation of the pupil-iris boundary. We estimate HRV from energy distribution in the low frequency (LF) (0.04 to 0.15 Hz) and high frequency (HF) (0.15 to 0.4 Hz) bands of the power spectrum of the pupillary fluctuations. In our study, we noted statistically significant correlation between the estimated HRV and the ground truth measures under a range of breathing conditions and under different illumination levels. The high degree of agreement evident in our results suggests that pupillary fluctuations obtained in a contactless fashion can be a reliable indicator of HRV. |
Aryal, S; Gutierrez-Osuna, R Articulatory Inversion and Synthesis: Towards Articulatory-Based Modification of Speech Technical Report 2012. @techreport{aryal2012techreport,
title = {Articulatory Inversion and Synthesis: Towards Articulatory-Based Modification of Speech},
author = {S Aryal and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/aryal2012techreport.pdf},
year = {2012},
date = {2012-12-04},
abstract = {Certain speech modifications, such as changes in foreign/regional accents or articulatory styles, are performed more effectively in the articulatory domain than in the acoustic domain. Though measuring articulators is cumbersome, articulatory parameters may be estimated from acoustics through inversion. In this paper, we study the impact on synthesis quality when articulators predicted from acoustics are used in articulatory synthesis. For this purpose, we trained a GMM articulatory synthesizer and drove it with articulators predicted with an RBF-based inversion model. Using inverted instead of measured articulators degraded synthesis quality, as measured through Mel cepstral distortion and subjective tests. However, retraining the synthesizer with predicted articulators not only reversed the effect of errors introduced during inversion but also improved synthesis quality relative to using measured articulators. These results suggest that inverted articulators do not compromise synthesis quality, and open up the possibility of performing speech modification in the articulatory domain through inversion.},
keywords = {Articulatory inversion, Articulatory synthesis, Speech},
pubstate = {published},
tppubtype = {techreport}
}
Certain speech modifications, such as changes in foreign/regional accents or articulatory styles, are performed more effectively in the articulatory domain than in the acoustic domain. Though measuring articulators is cumbersome, articulatory parameters may be estimated from acoustics through inversion. In this paper, we study the impact on synthesis quality when articulators predicted from acoustics are used in articulatory synthesis. For this purpose, we trained a GMM articulatory synthesizer and drove it with articulators predicted with an RBF-based inversion model. Using inverted instead of measured articulators degraded synthesis quality, as measured through Mel cepstral distortion and subjective tests. However, retraining the synthesizer with predicted articulators not only reversed the effect of errors introduced during inversion but also improved synthesis quality relative to using measured articulators. These results suggest that inverted articulators do not compromise synthesis quality, and open up the possibility of performing speech modification in the articulatory domain through inversion. |
Aryal, S; Huang, J; Felps, D; Gutierrez-Osuna, R Boosting Automatic Speech Recognition through Articulatory Inversion Technical Report 2012. @techreport{aryal2012techreport-2,
title = {Boosting Automatic Speech Recognition through Articulatory Inversion},
author = {S Aryal and J Huang and D Felps and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/aryal2012techreport-2.pdf},
year = {2012},
date = {2012-12-04},
abstract = {This paper explores whether articulatory features predicted from speech acoustics through inversion may be used to boost the recognition of context-dependent units when combined with acoustic features. For this purpose, we performed articulatory inversion on a corpus containing acoustic and electromagnetic articulography recordings from a single speaker. We then compared the performance of an HMM-based diphone classifier on the individual feature sets (acoustic, articulatory, inversion) as well as on their combinations. To make good use of the limited corpus, we used a factorized representation that first classified diphones into broad overlapping categories and then combined them using a maximum-a-posteriori criterion. When comparing the individual feature sets, our results show no degradation in classification performance when predicted articulators are used instead of ground-truth articulators. Further, performance on the acoustic feature set improved by 10% when adding ground-truth articulators and by 5% when adding predicted articulators.},
keywords = {Articulatory inversion},
pubstate = {published},
tppubtype = {techreport}
}
This paper explores whether articulatory features predicted from speech acoustics through inversion may be used to boost the recognition of context-dependent units when combined with acoustic features. For this purpose, we performed articulatory inversion on a corpus containing acoustic and electromagnetic articulography recordings from a single speaker. We then compared the performance of an HMM-based diphone classifier on the individual feature sets (acoustic, articulatory, inversion) as well as on their combinations. To make good use of the limited corpus, we used a factorized representation that first classified diphones into broad overlapping categories and then combined them using a maximum-a-posteriori criterion. When comparing the individual feature sets, our results show no degradation in classification performance when predicted articulators are used instead of ground-truth articulators. Further, performance on the acoustic feature set improved by 10% when adding ground-truth articulators and by 5% when adding predicted articulators. |
Monteiro, C; Gutierrez-Osuna, R; Shipman, F Design and Evaluation of Classifier for Identifying Sign Language Videos in Video Sharing Sites Conference 13th International ACM SIGACCESS Conference on Computers and Accessibility (ASSETS 2012)., 2012. @conference{monteiro2012assets,
title = {Design and Evaluation of Classifier for Identifying Sign Language Videos in Video Sharing Sites},
author = {C Monteiro and R Gutierrez-Osuna and F Shipman},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/monteiro2012assets.pdf},
year = {2012},
date = {2012-10-22},
booktitle = {13th International ACM SIGACCESS Conference on Computers and Accessibility (ASSETS 2012).},
abstract = {Video sharing sites provide an opportunity for the collection and use of sign language presentations about a wide range of topics. Currently, locating sign language videos (SL videos) in such sharing sites relies on the existence and accuracy of tags, titles or other metadata indicating the content is in sign language. In this paper, we describe the design and evaluation of a classifier for distinguishing between sign language videos and other videos. A test collection of SL videos and videos likely to be incorrectly recognized as SL videos (likely false positives) was created for evaluating alternative classifiers. Five video features thought to be potentially valuable for this task were developed based on common video analysis techniques. A comparison of the relative value of the five video features shows that a measure of the symmetry of movement relative to the face is the best feature for distinguishing sign language videos. Overall, an SVM classifier provided with all five features achieves 82% precision and 90% recall when tested on the challenging test collection. The performance would be considerably higher when applied to the more varied collections of large video sharing sites.},
keywords = {Computer vision, Gestures},
pubstate = {published},
tppubtype = {conference}
}
Video sharing sites provide an opportunity for the collection and use of sign language presentations about a wide range of topics. Currently, locating sign language videos (SL videos) in such sharing sites relies on the existence and accuracy of tags, titles or other metadata indicating the content is in sign language. In this paper, we describe the design and evaluation of a classifier for distinguishing between sign language videos and other videos. A test collection of SL videos and videos likely to be incorrectly recognized as SL videos (likely false positives) was created for evaluating alternative classifiers. Five video features thought to be potentially valuable for this task were developed based on common video analysis techniques. A comparison of the relative value of the five video features shows that a measure of the symmetry of movement relative to the face is the best feature for distinguishing sign language videos. Overall, an SVM classifier provided with all five features achieves 82% precision and 90% recall when tested on the challenging test collection. The performance would be considerably higher when applied to the more varied collections of large video sharing sites. |
Son, Y; Parnandi, A; Gutierrez-Osuna, R A Control-Theoretic Approach to Adaptive Physiological Games Technical Report 2012. @techreport{son2012techreport,
title = {A Control-Theoretic Approach to Adaptive Physiological Games},
author = {Y Son and A Parnandi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/son2012techreport.pdf},
year = {2012},
date = {2012-09-21},
abstract = {This paper presents an adaptive biofeedback videogame
that aims to maintain the player’s arousal level at an
optimum level by monitoring physiological signals and
manipulating game difficulty accordingly. We use concepts
from classical control theory to model the interaction
between human physiology and game difficulty during
game play. Based on this control model, we have developed
a real-time car-racing game with adaptive game mechanics.
Specifically, we utilized car speed, road visibility, and
steering jitter as three mechanisms to manipulate game
difficulty. We propose quantitative measures to characterize
the extent to which these three game adaptations can
manipulate the player’s arousal. For this purpose, we used
electrodermal activity (EDA) as a physiological correlate of
arousal. We have validated our approach by conducting
experimental trials with 20 subjects in both open-loop (no
feedback) and closed-loop (negative feedback) conditions.
Our results show statistically significant differences among
the three game mechanics in terms of their effectiveness.
Specifically, manipulating car speed provides higher
arousal levels than modulating road visibility or vehicle
steering. Finally, we discuss the theoretical and practical
implications of our approach},
keywords = {Electrodermal activity, Games, Health, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {techreport}
}
This paper presents an adaptive biofeedback videogame
that aims to maintain the player’s arousal level at an
optimum level by monitoring physiological signals and
manipulating game difficulty accordingly. We use concepts
from classical control theory to model the interaction
between human physiology and game difficulty during
game play. Based on this control model, we have developed
a real-time car-racing game with adaptive game mechanics.
Specifically, we utilized car speed, road visibility, and
steering jitter as three mechanisms to manipulate game
difficulty. We propose quantitative measures to characterize
the extent to which these three game adaptations can
manipulate the player’s arousal. For this purpose, we used
electrodermal activity (EDA) as a physiological correlate of
arousal. We have validated our approach by conducting
experimental trials with 20 subjects in both open-loop (no
feedback) and closed-loop (negative feedback) conditions.
Our results show statistically significant differences among
the three game mechanics in terms of their effectiveness.
Specifically, manipulating car speed provides higher
arousal levels than modulating road visibility or vehicle
steering. Finally, we discuss the theoretical and practical
implications of our approach |
Huang, J; Gosangi, R; Gutierrez-Osuna, R Active Concentration-Independent Chemical Identification with a Tunable Infrared Sensor Journal Article In: Sensors Journal, IEEE, 2012. @article{huang2012sj,
title = {Active Concentration-Independent Chemical Identification with a Tunable Infrared Sensor},
author = {J Huang and R Gosangi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/huang2012sj.pdf},
year = {2012},
date = {2012-09-03},
journal = {Sensors Journal, IEEE},
abstract = {This paper presents an active sensing framework for concentration-independent identification of volatile chemicals using a tunable infrared interferometer. The framework operates in real time to generate a sequence of absorption lines that can best discriminate among a given set of chemicals. The active-sensing algorithm was previously developed to optimize temperature programs for metal-oxide chemosensors. Here, we adapt it to tune a non-dispersive infrared spectroscope based on a Fabry-Perot interferometer (FPI). We also extend this framework to allow the identification of chemical samples irrespective of their concentrations. Namely, we use non-negative matrix factorization (NMF) to create concentration-independent absorption profiles of different chemicals, and then employ linear least squares to fit sensor observations to the response profiles. We tested the framework on a simulated classification problem with 27 chemicals and compared against a passive sensing approach; active sensing consistently outperformed passive sensing in terms of classification performance for various sensing budgets and at various levels of sensor noise. We also validated the approach experimentally using a commercial FPI sensor and a database of eight household chemicals. Our results show the method is able to predict the sample identity irrespective of concentration.},
keywords = {Active sensing, Chemical sensors, Infrared spectroscopy},
pubstate = {published},
tppubtype = {article}
}
This paper presents an active sensing framework for concentration-independent identification of volatile chemicals using a tunable infrared interferometer. The framework operates in real time to generate a sequence of absorption lines that can best discriminate among a given set of chemicals. The active-sensing algorithm was previously developed to optimize temperature programs for metal-oxide chemosensors. Here, we adapt it to tune a non-dispersive infrared spectroscope based on a Fabry-Perot interferometer (FPI). We also extend this framework to allow the identification of chemical samples irrespective of their concentrations. Namely, we use non-negative matrix factorization (NMF) to create concentration-independent absorption profiles of different chemicals, and then employ linear least squares to fit sensor observations to the response profiles. We tested the framework on a simulated classification problem with 27 chemicals and compared against a passive sensing approach; active sensing consistently outperformed passive sensing in terms of classification performance for various sensing budgets and at various levels of sensor noise. We also validated the approach experimentally using a commercial FPI sensor and a database of eight household chemicals. Our results show the method is able to predict the sample identity irrespective of concentration. |
Masood, K; Choi, J; Ahmed, B; Gutierrez-Osuna, R Consistency and Validity of Self-reporting Scores in Stress Measurement Surveys Conference 2012 Annual International Conference of the IEEE Engineering in Medicine and Biology Society (EMBS), 2012. @conference{masood2012embs,
title = {Consistency and Validity of Self-reporting Scores in Stress Measurement Surveys},
author = {K Masood and J Choi and B Ahmed and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/masood2012embs.pdf},
year = {2012},
date = {2012-09-01},
booktitle = {2012 Annual International Conference of the IEEE Engineering in Medicine and Biology Society (EMBS)},
pages = {4895-4898},
abstract = {Stress has been attributed to physiological and psychological demands that exceed the natural regulatory capacity of a person. Chronic stress is not only a catalyst for diseases such as hypertension, diabetes, insomnia but may also lead to social problems such as marriage breakups, suicide and violence. Objective assessment of stress is difficult so self-reports are commonly used to indicate the severity of stress. However, empirical information on the validity of self-reports is limited. The present study investigated the authenticity and validity of different self-report surveys. An analysis, based on a three-pronged strategy, was performed on these surveys. It was concluded that although subjects are prone to systematic error in reporting, self-reports can provide a useful substitute for data modeling specifically in stress evaluation where other objective assessments such as determination of stress using only physiological response are difficult.},
keywords = {Health, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {conference}
}
Stress has been attributed to physiological and psychological demands that exceed the natural regulatory capacity of a person. Chronic stress is not only a catalyst for diseases such as hypertension, diabetes, insomnia but may also lead to social problems such as marriage breakups, suicide and violence. Objective assessment of stress is difficult so self-reports are commonly used to indicate the severity of stress. However, empirical information on the validity of self-reports is limited. The present study investigated the authenticity and validity of different self-report surveys. An analysis, based on a three-pronged strategy, was performed on these surveys. It was concluded that although subjects are prone to systematic error in reporting, self-reports can provide a useful substitute for data modeling specifically in stress evaluation where other objective assessments such as determination of stress using only physiological response are difficult. |
Parnandi, A; Son, Y; Shahin, M; Ahmed, B; Gutierrez-Osuna, R Architecture of an Automated Therapy Tool for Childhood Apraxia of Speech Technical Report 2012. @techreport{parnandi2012techreport-2,
title = {Architecture of an Automated Therapy Tool for Childhood Apraxia of Speech},
author = {A Parnandi and Y Son and M Shahin and B Ahmed and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/parnandi2012techreport-2.pdf},
year = {2012},
date = {2012-08-21},
urldate = {2012-08-21},
abstract = {We present a multi-tier architecture for automating the administration of speech therapy to children suffering from apraxia of speech. This architecture follows a client-server model and facilitates task-oriented remote therapeutic training in home settings. The therapy regimen is remotely assigned to the child by a speech therapist based on a standardized protocol. We utilize tablet PCs to provide stimuli to the children and record their speech response. The speech data is then streamed to a back-end server running a specialized speech-processing module to identify errors and quantify the progress of the child. These automated results allow the therapist to closely monitor the performance of each child, provide relevant feedback, and adapt the training program as needed. Our proposed architecture can accommodate a variety of interaction modalities that can serve as a complement to traditional face-to-face speech practice. In this paper we describe the client-server architecture, the middleware tools upon which the system has been built, and the speechprocessing tools for automatically scoring the patients’ speech.},
keywords = {Games, Health, Mobile computing, Speech},
pubstate = {published},
tppubtype = {techreport}
}
We present a multi-tier architecture for automating the administration of speech therapy to children suffering from apraxia of speech. This architecture follows a client-server model and facilitates task-oriented remote therapeutic training in home settings. The therapy regimen is remotely assigned to the child by a speech therapist based on a standardized protocol. We utilize tablet PCs to provide stimuli to the children and record their speech response. The speech data is then streamed to a back-end server running a specialized speech-processing module to identify errors and quantify the progress of the child. These automated results allow the therapist to closely monitor the performance of each child, provide relevant feedback, and adapt the training program as needed. Our proposed architecture can accommodate a variety of interaction modalities that can serve as a complement to traditional face-to-face speech practice. In this paper we describe the client-server architecture, the middleware tools upon which the system has been built, and the speechprocessing tools for automatically scoring the patients’ speech. |
Alamudun, F; Choi, J; Gutierrez-Osuna, R; Khan, H; Ahmed, B Removal of Subject-Dependent and Activity-Dependent Variation in Physiological Measures of Stress Conference Proceedings of Pervasive Computing Technologies for Healthcare, 2012, ISBN: 978-1-936968-43-5. @conference{alamudun2012phealth,
title = {Removal of Subject-Dependent and Activity-Dependent Variation in Physiological Measures of Stress},
author = {F Alamudun and J Choi and R Gutierrez-Osuna and H Khan and B Ahmed},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/alamudun2012phealth.pdf},
isbn = {978-1-936968-43-5},
year = {2012},
date = {2012-05-21},
booktitle = {Proceedings of Pervasive Computing Technologies for Healthcare},
pages = {115},
abstract = {The ability to monitor stress levels in daily life can provide valuable information to patients and their caretakers, help identify potential stressors, determine appropriate interventions, and monitor their effectiveness. Wearable sensor technology makes it now possible to measure non-invasively a number of physiological correlates of stress, from skin conductance to heart rate variability. These measures, however, show large individual differences and are also correlated with the physical activity of the subject. In this paper, we propose two multivariate signal processing techniques to reduce the effect of both forms of interference. The first method is an unsupervised technique that removes any systematic variation that is orthogonal to the dependent variable, in this case physiological stress. In contrast, the second method is a supervised technique that first projects the data into a subspace that emphasizes these systematic variations, and then removes them from the data. The two methods were validated on an experimental dataset containing physiological recordings from multiple subjects performing physical and/or mental activities. When compared to z-score normalization, the standard method for removing individual differences, our methods can reduce stress prediction errors by as much as 50%.},
keywords = {Electrodermal activity, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {conference}
}
The ability to monitor stress levels in daily life can provide valuable information to patients and their caretakers, help identify potential stressors, determine appropriate interventions, and monitor their effectiveness. Wearable sensor technology makes it now possible to measure non-invasively a number of physiological correlates of stress, from skin conductance to heart rate variability. These measures, however, show large individual differences and are also correlated with the physical activity of the subject. In this paper, we propose two multivariate signal processing techniques to reduce the effect of both forms of interference. The first method is an unsupervised technique that removes any systematic variation that is orthogonal to the dependent variable, in this case physiological stress. In contrast, the second method is a supervised technique that first projects the data into a subspace that emphasizes these systematic variations, and then removes them from the data. The two methods were validated on an experimental dataset containing physiological recordings from multiple subjects performing physical and/or mental activities. When compared to z-score normalization, the standard method for removing individual differences, our methods can reduce stress prediction errors by as much as 50%. |
Choi, J; Ahmed, B; Gutierrez-Osuna, R Development and Evaluation of an Ambulatory Stress Monitor Based on Wearable Sensors Journal Article In: IEEE Transactions on Information Technology in Biomedicine, no. 99, pp. 279 - 286, 2012. @article{choi2012titb,
title = {Development and Evaluation of an Ambulatory Stress Monitor Based on Wearable Sensors},
author = {J Choi and B Ahmed and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/choi2012titb.pdf},
year = {2012},
date = {2012-03-01},
journal = {IEEE Transactions on Information Technology in Biomedicine},
number = {99},
pages = {279 - 286},
publisher = {IEEE},
abstract = {Chronic stress is endemic to modern society. However, as it is unfeasible for physicians to continuously monitor stress levels, its diagnosis is nontrivial. Wireless body sensor networks offer opportunities to ubiquitously detect and monitor mental stress levels, enabling improved diagnosis, and early treatment. This article describes the development of a wearable sensor platform to monitor a number of physiological correlates of mental stress. We discuss tradeoffs in both system design and sensor selection to balance information content and wearability. Using experimental signals collected from the wearable sensor, we describe a selected number of physiological features that show good correlation with mental stress. In particular, we propose a new spectral feature that estimates the balance of the autonomic nervous system by combining information from the power spectral density of respiration and heart rate variability. We validate the effectiveness of our approach on a binary discrimination problem when subjects are placed under two psychophysiological conditions: mental stress and relaxation. When used in a logistic regression model, our feature set is able to discriminate between these two mental states with a success rate of 81% across subjects.},
keywords = {Electrodermal activity, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
Chronic stress is endemic to modern society. However, as it is unfeasible for physicians to continuously monitor stress levels, its diagnosis is nontrivial. Wireless body sensor networks offer opportunities to ubiquitously detect and monitor mental stress levels, enabling improved diagnosis, and early treatment. This article describes the development of a wearable sensor platform to monitor a number of physiological correlates of mental stress. We discuss tradeoffs in both system design and sensor selection to balance information content and wearability. Using experimental signals collected from the wearable sensor, we describe a selected number of physiological features that show good correlation with mental stress. In particular, we propose a new spectral feature that estimates the balance of the autonomic nervous system by combining information from the power spectral density of respiration and heart rate variability. We validate the effectiveness of our approach on a binary discrimination problem when subjects are placed under two psychophysiological conditions: mental stress and relaxation. When used in a logistic regression model, our feature set is able to discriminate between these two mental states with a success rate of 81% across subjects. |
Lucchese, G; Field, M; Ho, J; Gutierrez-Osuna, R; Hammond, T GestureCommander: continuous touch-based gesture prediction Conference Proceedings of the 2012 ACM annual conference extended abstracts on Human Factors in Computing Systems Extended Abstracts, ACM 2012. @conference{lucchese2012chi,
title = {GestureCommander: continuous touch-based gesture prediction},
author = {G Lucchese and M Field and J Ho and R Gutierrez-Osuna and T Hammond},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/lucchese2012chi.pdf},
year = {2012},
date = {2012-01-01},
booktitle = {Proceedings of the 2012 ACM annual conference extended abstracts on Human Factors in Computing Systems Extended Abstracts},
pages = {1925--1930},
organization = {ACM},
abstract = {GestureCommander is a touch-based gesture control system for mobile devices that is able to recognize gestures as they are being performed. Continuous recognition allows the system to provide visual feedback to the user and to anticipate user commands to possibly decrease perceived response time. To achieve this goal we employ two Hidden Markov Model (HMM) systems, one for recognition and another for generating visual feedback. We analyze a set of geometric features used in other gesture recognition systems and determine a subset that works best for HMMs. Finally we demonstrate the practicality of our recognition HMMs in a proof of concept mobile application for Google's Android mobile platform that has a recognition accuracy rate of 96% over 15 distinct gestures.},
keywords = {Gestures, Mobile computing},
pubstate = {published},
tppubtype = {conference}
}
GestureCommander is a touch-based gesture control system for mobile devices that is able to recognize gestures as they are being performed. Continuous recognition allows the system to provide visual feedback to the user and to anticipate user commands to possibly decrease perceived response time. To achieve this goal we employ two Hidden Markov Model (HMM) systems, one for recognition and another for generating visual feedback. We analyze a set of geometric features used in other gesture recognition systems and determine a subset that works best for HMMs. Finally we demonstrate the practicality of our recognition HMMs in a proof of concept mobile application for Google's Android mobile platform that has a recognition accuracy rate of 96% over 15 distinct gestures. |
Felps, D; Geng, C; Gutierrez-Osuna, R Foreign accent conversion through concatenative synthesis in the articulatory domain Journal Article In: IEEE Transactions on Audio, Speech and Language Processing, 2012. @article{felps2012taslp,
title = {Foreign accent conversion through concatenative synthesis in the articulatory domain},
author = {D Felps and C Geng and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/felps2012taslp.pdf},
year = {2012},
date = {2012-01-01},
journal = {IEEE Transactions on Audio, Speech and Language Processing},
abstract = {We propose a concatenative synthesis approach to the problem of foreign accent conversion. The approach consists of replacing the most accented portions of nonnative speech with alternative segments from a corpus of the speaker’s own speech based on their similarity to those from a reference native speaker. We propose and compare two approaches for selecting units, one based on acoustic similarity [e.g., mel frequency cepstral coeffi-cients (MFCCs)] and a second one based on articulatory similarity, as measured through electromagnetic articulography (EMA). Our hypothesis is that articulatory features provide a better metric for linguistic similarity across speakers than acoustic features. To test this hypothesis, we recorded an articulatory-acoustic corpus from a native and a nonnative speaker, and
evaluated the two speech representations (acoustic versus articulatory) through a series of perceptual experiments. Formal listening tests indicate that the approach can achieve a 20% reduction in perceived accent, but also reveal a strong coupling between accent and speaker identity. To address this issue, we disguised original and resynthesized utterances by altering their average pitch and normalizing vocal tract length. An additional listening experiment supports the hypothesis that articulatory features are less speaker dependent than acoustic features.},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {article}
}
We propose a concatenative synthesis approach to the problem of foreign accent conversion. The approach consists of replacing the most accented portions of nonnative speech with alternative segments from a corpus of the speaker’s own speech based on their similarity to those from a reference native speaker. We propose and compare two approaches for selecting units, one based on acoustic similarity [e.g., mel frequency cepstral coeffi-cients (MFCCs)] and a second one based on articulatory similarity, as measured through electromagnetic articulography (EMA). Our hypothesis is that articulatory features provide a better metric for linguistic similarity across speakers than acoustic features. To test this hypothesis, we recorded an articulatory-acoustic corpus from a native and a nonnative speaker, and
evaluated the two speech representations (acoustic versus articulatory) through a series of perceptual experiments. Formal listening tests indicate that the approach can achieve a 20% reduction in perceived accent, but also reveal a strong coupling between accent and speaker identity. To address this issue, we disguised original and resynthesized utterances by altering their average pitch and normalizing vocal tract length. An additional listening experiment supports the hypothesis that articulatory features are less speaker dependent than acoustic features. |
2011
|
Lee, J; Young, S S; Gutierrez-Osuna, R An Iterative Image Registration Technique Using a Scale-Space Model Technical Report 2011. @techreport{lee2011iterative,
title = {An Iterative Image Registration Technique Using a Scale-Space Model},
author = {J Lee and S S Young and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/lee2011iterative.pdf},
year = {2011},
date = {2011-12-01},
abstract = {Registration between two images is a key problem in computer vision. Current methods tend to separate the scale estimation process from translation and rotation estimation. This is due to the fact that the scale parameter is inherently related to the image resolution. In this paper, we present an area-based image registration technique that can simultaneously estimate translation, rotation, and scale parameters and take into account differences in resolution between two images. We first develop a scale-space model that relates the entire reference image pixels to a single observed image pixel with a scale parameter. This model is then easily generalized to include x-y translation and rotation parameters. By embedding this scale-space model into a non-linear least squares method, we can iteratively estimate the four registration parameters (x-y shift, rotation, and scale) in a unified manner. We test the validity of the proposed method on both simulated and real image data.},
keywords = {Computer vision},
pubstate = {published},
tppubtype = {techreport}
}
Registration between two images is a key problem in computer vision. Current methods tend to separate the scale estimation process from translation and rotation estimation. This is due to the fact that the scale parameter is inherently related to the image resolution. In this paper, we present an area-based image registration technique that can simultaneously estimate translation, rotation, and scale parameters and take into account differences in resolution between two images. We first develop a scale-space model that relates the entire reference image pixels to a single observed image pixel with a scale parameter. This model is then easily generalized to include x-y translation and rotation parameters. By embedding this scale-space model into a non-linear least squares method, we can iteratively estimate the four registration parameters (x-y shift, rotation, and scale) in a unified manner. We test the validity of the proposed method on both simulated and real image data. |
Choi, J; Gutierrez-Osuna, R Removal of respiratory influences from heart rate variability in stress monitoring Journal Article In: IEEE Sensors Journal, vol. 11, no. 11, pp. 2649-2656, 2011. @article{choi2011removal,
title = {Removal of respiratory influences from heart rate variability in stress monitoring},
author = {J Choi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/choi2011removal.pdf},
year = {2011},
date = {2011-01-01},
journal = {IEEE Sensors Journal},
volume = {11},
number = {11},
pages = {2649-2656},
publisher = {IEEE},
abstract = {This paper addresses a major weakness of traditional heart-rate-variability (HRV) analysis for the purpose of monitoring stress: sensitivity to respiratory influences. To address this issue, a linear system-identification model of the cardiorespiratory system using commercial heart rate monitors and respiratory sensors was constructed. Subtraction of respiratory driven fluctuations in heart rate leads to a residual signal where the effects of mental stress become more salient. We experimentally validated the effectiveness of this method on a binary discrimination problem with two conditions: mental stress of subjects performing cognitive tasks and a relaxation condition. In the process, we also propose a normalization method that can be used to compensate for ventilation differences between paced and spontaneous breathing. Our results suggest that, by separating respiration influences, the residual HRV has more discrimination power than traditional HRV analysis for the purpose of monitoring mental stress/load.},
keywords = {Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {article}
}
This paper addresses a major weakness of traditional heart-rate-variability (HRV) analysis for the purpose of monitoring stress: sensitivity to respiratory influences. To address this issue, a linear system-identification model of the cardiorespiratory system using commercial heart rate monitors and respiratory sensors was constructed. Subtraction of respiratory driven fluctuations in heart rate leads to a residual signal where the effects of mental stress become more salient. We experimentally validated the effectiveness of this method on a binary discrimination problem with two conditions: mental stress of subjects performing cognitive tasks and a relaxation condition. In the process, we also propose a normalization method that can be used to compensate for ventilation differences between paced and spontaneous breathing. Our results suggest that, by separating respiration influences, the residual HRV has more discrimination power than traditional HRV analysis for the purpose of monitoring mental stress/load. |
Gutierrez-Osuna, R; Gosangi, R; Hierlemann, A Invited: Advances in Active and Adaptive Chemical Sensing Conference Proceedings of the 14th International Symposium on Olfaction and Electronic Nose, 2011. @conference{gutierrez2011invited,
title = {Invited: Advances in Active and Adaptive Chemical Sensing},
author = {R Gutierrez-Osuna and R Gosangi and A Hierlemann},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2011invited.pdf},
year = {2011},
date = {2011-01-01},
booktitle = {Proceedings of the 14th International Symposium on Olfaction and Electronic Nose},
abstract = {In this presentation, we will review advances at the chemical sensor and data processing levels that may enable the development of adaptive sensors. We will briefly discuss techniques at the sensor and system levels, including modulation of internal parameters (e.g., operating temperatures and absorption wavelengths) and external parameters (e.g., exposure times, preconcentration temperatures). At the signal processing level, we will overview adaptive filtering strategies that may be used to cancel interferences (e.g., environmental variables, drift), adaptive classification techniques for incremental learning in dynamic environments, and active sensing methods for on‐line optimization of sensor arrays and individual tunable sensors. We will also present a methodology based on probabilistic graphical models that may be used to model the dynamic response of metal‐oxide sensors under temperature modulation and select suitable temperature sequences on‐the‐fly, as the sensor interacts with its environment.},
keywords = {Active sensing},
pubstate = {published},
tppubtype = {conference}
}
In this presentation, we will review advances at the chemical sensor and data processing levels that may enable the development of adaptive sensors. We will briefly discuss techniques at the sensor and system levels, including modulation of internal parameters (e.g., operating temperatures and absorption wavelengths) and external parameters (e.g., exposure times, preconcentration temperatures). At the signal processing level, we will overview adaptive filtering strategies that may be used to cancel interferences (e.g., environmental variables, drift), adaptive classification techniques for incremental learning in dynamic environments, and active sensing methods for on‐line optimization of sensor arrays and individual tunable sensors. We will also present a methodology based on probabilistic graphical models that may be used to model the dynamic response of metal‐oxide sensors under temperature modulation and select suitable temperature sequences on‐the‐fly, as the sensor interacts with its environment. |
Gosangi, R; Gutierrez-Osuna, R Quantification of Gas Mixtures with Active Recursive Estimation Conference Proceedings of the 14th International Symposium on Olfaction and Electronic Nose, 2011. @conference{gosangi2011quantification,
title = {Quantification of Gas Mixtures with Active Recursive Estimation},
author = {R Gosangi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gosangi2011quantification.pdf},
year = {2011},
date = {2011-01-01},
booktitle = {Proceedings of the 14th International Symposium on Olfaction and Electronic Nose},
journal = {AIP Conference Proceedings},
pages = {23-24},
abstract = {We present an active‐sensing strategy to estimate the concentrations in a gas mixture using temperature modulation of metal‐oxide (MOX) sensors. The approach is based on recursive Bayesian estimation and uses an information‐theoretic criterion to select operating temperatures on‐the‐fly. Recursive estimation has been widely used in mobile robotics, e.g., for localization purposes. Here, we employ a similar approach to estimate the concentrations of the constituents in a gas mixture. In this formulation, we represent a concentration profile as a discrete state and maintain a ‘belief’ distribution that represents the probability of each state. We employ a Bayes filter to update the belief distribution whenever new sensor measurements arrive, and a mutual‐information criterion to select the next operating temperature. This allows us to optimize the temperature program in real time, as the sensor interacts with its environment. We validate our approach on a simulated dataset generated from temperature modulated responses of a MOX sensor exposed to a mixture of three analytes. The results presented here provide a preliminary proof of concept for an agile approach to quantifying gas mixtures.},
keywords = {Active sensing, Metal-oxide sensors},
pubstate = {published},
tppubtype = {conference}
}
We present an active‐sensing strategy to estimate the concentrations in a gas mixture using temperature modulation of metal‐oxide (MOX) sensors. The approach is based on recursive Bayesian estimation and uses an information‐theoretic criterion to select operating temperatures on‐the‐fly. Recursive estimation has been widely used in mobile robotics, e.g., for localization purposes. Here, we employ a similar approach to estimate the concentrations of the constituents in a gas mixture. In this formulation, we represent a concentration profile as a discrete state and maintain a ‘belief’ distribution that represents the probability of each state. We employ a Bayes filter to update the belief distribution whenever new sensor measurements arrive, and a mutual‐information criterion to select the next operating temperature. This allows us to optimize the temperature program in real time, as the sensor interacts with its environment. We validate our approach on a simulated dataset generated from temperature modulated responses of a MOX sensor exposed to a mixture of three analytes. The results presented here provide a preliminary proof of concept for an agile approach to quantifying gas mixtures. |
Huang, J; Gosangi, R; Gutierrez-Osuna, R Active Sensing with Fabry-Perot Infrared Interferometers Conference Proceedings of the 14th International Symposium on Olfaction and Electronic Nose, 2011. @conference{huang2011active,
title = {Active Sensing with Fabry-Perot Infrared Interferometers},
author = {J Huang and R Gosangi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/huang2011active.pdf},
year = {2011},
date = {2011-01-01},
booktitle = {Proceedings of the 14th International Symposium on Olfaction and Electronic Nose},
journal = {AIP Conference Proceedings},
pages = {31-32},
abstract = {In this article, we describe an active‐sensing framework for infrared (IR) spectroscopy. The goal is to generate a sequence of wavelengths that best discriminates among chemicals. Unlike feature‐selection strategies, the sequence is selected on‐the‐fly as the device acquires data. The framework models the problem as a Partially Observable Markov Decision Process (POMDP), which is solved by a greedy myopic algorithm. In previous work [1], we had applied this framework to temperature‐modulated metal oxide sensor. Here, we adapt the framework to a tunable IR sensor based on Fabry‐Perot interferometers (FPI). FPIs provide a low‐cost alternative to traditional Fourier Transform Infrared Spectroscopy (FTIR), though at the expense of a narrower effective range and lower spectral resolution. Here, we first test whether the framework can scale up to large problems consisting 27 chemicals with 60 dimensions; our previous work on metal oxide sensors employed three chemicals and 7 dimensions. For this purpose, FPI spectra are simulated from FTIR. Then we validate the framework experimentally on 3 chemicals using a prototype instrument based on FPIs. These preliminary results are encouraging and indicate that the framework is able to solve classification problems of reasonable size.},
keywords = {Active sensing, Infrared spectroscopy},
pubstate = {published},
tppubtype = {conference}
}
In this article, we describe an active‐sensing framework for infrared (IR) spectroscopy. The goal is to generate a sequence of wavelengths that best discriminates among chemicals. Unlike feature‐selection strategies, the sequence is selected on‐the‐fly as the device acquires data. The framework models the problem as a Partially Observable Markov Decision Process (POMDP), which is solved by a greedy myopic algorithm. In previous work [1], we had applied this framework to temperature‐modulated metal oxide sensor. Here, we adapt the framework to a tunable IR sensor based on Fabry‐Perot interferometers (FPI). FPIs provide a low‐cost alternative to traditional Fourier Transform Infrared Spectroscopy (FTIR), though at the expense of a narrower effective range and lower spectral resolution. Here, we first test whether the framework can scale up to large problems consisting 27 chemicals with 60 dimensions; our previous work on metal oxide sensors employed three chemicals and 7 dimensions. For this purpose, FPI spectra are simulated from FTIR. Then we validate the framework experimentally on 3 chemicals using a prototype instrument based on FPIs. These preliminary results are encouraging and indicate that the framework is able to solve classification problems of reasonable size. |
Boulos, M N K; Blanchard, B J; Walker, C; Montero, J; Tripathy, A; Gutierrez-Osuna, R Web GIS in practice X: a Microsoft Kinect natural user interface for Google Earth navigation Journal Article In: International Journal of Health Geographics, vol. 10, no. 1, pp. 45, 2011. @article{boulos2011web,
title = {Web GIS in practice X: a Microsoft Kinect natural user interface for Google Earth navigation},
author = {M N K Boulos and B J Blanchard and C Walker and J Montero and A Tripathy and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/boulos2011web.pdf},
year = {2011},
date = {2011-01-01},
journal = {International Journal of Health Geographics},
volume = {10},
number = {1},
pages = {45},
publisher = {BioMed Central Ltd},
abstract = {This paper covers the use of depth sensors such as Microsoft Kinect and ASUS Xtion to provide a natural user interface (NUI) for controlling 3-D (three-dimensional) virtual globes such as Google Earth (including its Street View mode), Bing Maps 3D, and NASA World Wind. The paper introduces the Microsoft Kinect device, briefly describing how it works (the underlying technology by PrimeSense), as well as its market uptake and application potential beyond its original intended purpose as a home entertainment and video game controller. The different software drivers available for connecting the Kinect device to a PC (Personal Computer) are also covered, and their comparative pros and cons briefly discussed. We survey a number of approaches and application examples for controlling 3-D virtual globes using the Kinect sensor, then describe Kinoogle, a Kinect interface for natural interaction with Google Earth, developed by students at Texas A&M University. Readers interested in trying out the application on their own hardware can download a Zip archive (included with the manuscript as additional files 1, 2, & 3) that contains a 'Kinnogle installation package for Windows PCs'. Finally, we discuss some usability aspects of Kinoogle and similar NUIs for controlling 3-D virtual globes (including possible future improvements), and propose a number of unique, practical 'use scenarios' where such NUIs could prove useful in navigating a 3-D virtual globe, compared to conventional mouse/3-D mouse and keyboard-based interfaces.},
keywords = {Gestures},
pubstate = {published},
tppubtype = {article}
}
This paper covers the use of depth sensors such as Microsoft Kinect and ASUS Xtion to provide a natural user interface (NUI) for controlling 3-D (three-dimensional) virtual globes such as Google Earth (including its Street View mode), Bing Maps 3D, and NASA World Wind. The paper introduces the Microsoft Kinect device, briefly describing how it works (the underlying technology by PrimeSense), as well as its market uptake and application potential beyond its original intended purpose as a home entertainment and video game controller. The different software drivers available for connecting the Kinect device to a PC (Personal Computer) are also covered, and their comparative pros and cons briefly discussed. We survey a number of approaches and application examples for controlling 3-D virtual globes using the Kinect sensor, then describe Kinoogle, a Kinect interface for natural interaction with Google Earth, developed by students at Texas A&M University. Readers interested in trying out the application on their own hardware can download a Zip archive (included with the manuscript as additional files 1, 2, & 3) that contains a 'Kinnogle installation package for Windows PCs'. Finally, we discuss some usability aspects of Kinoogle and similar NUIs for controlling 3-D virtual globes (including possible future improvements), and propose a number of unique, practical 'use scenarios' where such NUIs could prove useful in navigating a 3-D virtual globe, compared to conventional mouse/3-D mouse and keyboard-based interfaces. |
Rodriguez, J; Gutierrez-Osuna, R Reverse caricatures effects on three-dimensional facial reconstructions Journal Article In: Image and Vision Computing, vol. 29, no. 5, pp. 329-334, 2011. @article{rodriguez2011reverse,
title = {Reverse caricatures effects on three-dimensional facial reconstructions},
author = {J Rodriguez and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/rodriguez2011reverse.pdf},
year = {2011},
date = {2011-01-01},
journal = {Image and Vision Computing},
volume = {29},
number = {5},
pages = {329-334},
publisher = {Elsevier},
abstract = {Previous research has shown that familiarization with three-dimensional (3D) caricatures can help improve recognition of same-race and other-race faces, a result that may lead to new training tools in security applications. Since 3D facial scans are not generally available, here we sought to determine whether 3D reconstructions from 2D frontal images could be used for the same purpose. Our results suggest that, despite the high level of photographic realism achieved by current 3D facial reconstruction methods, additional research is needed in order to reduce reconstruction errors and capture the distinctive facial traits of an individual.},
keywords = {Face perception},
pubstate = {published},
tppubtype = {article}
}
Previous research has shown that familiarization with three-dimensional (3D) caricatures can help improve recognition of same-race and other-race faces, a result that may lead to new training tools in security applications. Since 3D facial scans are not generally available, here we sought to determine whether 3D reconstructions from 2D frontal images could be used for the same purpose. Our results suggest that, despite the high level of photographic realism achieved by current 3D facial reconstruction methods, additional research is needed in order to reduce reconstruction errors and capture the distinctive facial traits of an individual. |
Shipman, F; Park, S I; Gutierrez-Osuna, R; Choi, J PerCon: Supporting the Management and Reuse of Wearable Sensor Data Technical Report 2011. @techreport{shipman2011percon,
title = {PerCon: Supporting the Management and Reuse of Wearable Sensor Data},
author = {F Shipman and S I Park and R Gutierrez-Osuna and J Choi},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/shipman2011percon.pdf},
year = {2011},
date = {2011-01-01},
abstract = {This paper describes the problem of managing wearable sensor data and the design of an environment to support this activity. We are engaged in studies collecting data from custom‐made and off‐the‐shelf wearable and mobile sensors to explore the impact of context and physiological state on cognitive performance. The data being collected has the potential to assess many potential hypotheses beyond the original hypothesis being explored. In order to achieve this potential, infrastructure is required to manage, access, preserve, and share the various types of digital objects recorded from individual research participants. As with many studies of individuals over time, there are a number of data streams correlated via timestamps for each participant. To manage this data we are developing PerCon. PerCon processes and integrates the individual datasets so as to be loosely coupled with the analysis techniques used in our first stage of research. In addition, PerCon provides services such as searching, indexing, browsing and visualization. PerCon’s APIs support access to and processing of the resources by user and researcher applications. A result of our activity is an initial representation of the relationships among the heterogeneous resources to facilitate their reuse. Longer term, this will be separated into domain‐independent and domaindependent ontologies of the data types and resources involved. The overall result is an architecture and initial instantiation for e‐Science and e‐Health digital libraries.},
keywords = {Health, Wearable sensors},
pubstate = {published},
tppubtype = {techreport}
}
This paper describes the problem of managing wearable sensor data and the design of an environment to support this activity. We are engaged in studies collecting data from custom‐made and off‐the‐shelf wearable and mobile sensors to explore the impact of context and physiological state on cognitive performance. The data being collected has the potential to assess many potential hypotheses beyond the original hypothesis being explored. In order to achieve this potential, infrastructure is required to manage, access, preserve, and share the various types of digital objects recorded from individual research participants. As with many studies of individuals over time, there are a number of data streams correlated via timestamps for each participant. To manage this data we are developing PerCon. PerCon processes and integrates the individual datasets so as to be loosely coupled with the analysis techniques used in our first stage of research. In addition, PerCon provides services such as searching, indexing, browsing and visualization. PerCon’s APIs support access to and processing of the resources by user and researcher applications. A result of our activity is an initial representation of the relationships among the heterogeneous resources to facilitate their reuse. Longer term, this will be separated into domain‐independent and domaindependent ontologies of the data types and resources involved. The overall result is an architecture and initial instantiation for e‐Science and e‐Health digital libraries. |
Gosangi, R; Gutierrez-Osuna, R Data-driven Modeling of Metal-oxide Sensors with Dynamic Bayesian Networks Conference Proceedings of the 14th International Symposium on Olfaction and Electronic Nose, 2011. @conference{gosangi2011data,
title = {Data-driven Modeling of Metal-oxide Sensors with Dynamic Bayesian Networks},
author = {R Gosangi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gosangi2011data.pdf},
year = {2011},
date = {2011-01-01},
booktitle = {Proceedings of the 14th International Symposium on Olfaction and Electronic Nose},
abstract = {We present a data‐driven probabilistic framework to model the transient response of MOX sensors modulated with a sequence of voltage steps. Analytical models of MOX sensors are usually built based on the physico‐chemical properties of the sensing materials. Although building these models provides an insight into the sensor behavior, they also require a thorough understanding of the underlying operating principles. Here we propose a data‐driven approach to characterize the dynamical relationship between sensor inputs and outputs. Namely, we use dynamic Bayesian networks (DBNs), probabilistic models that represent temporal relations between a set of random variables. We identify a set of control variables that influence the sensor responses, create a graphical representation that captures the causal relations between these variables, and finally train the model with experimental data. We validated the approach on experimental data in terms of predictive accuracy and classification performance. Our results show that DBNs can accurately predict the dynamic response of MOX sensors, as well as capture the discriminatory information present in the sensor transients.},
keywords = {Active sensing, Metal-oxide sensors},
pubstate = {published},
tppubtype = {conference}
}
We present a data‐driven probabilistic framework to model the transient response of MOX sensors modulated with a sequence of voltage steps. Analytical models of MOX sensors are usually built based on the physico‐chemical properties of the sensing materials. Although building these models provides an insight into the sensor behavior, they also require a thorough understanding of the underlying operating principles. Here we propose a data‐driven approach to characterize the dynamical relationship between sensor inputs and outputs. Namely, we use dynamic Bayesian networks (DBNs), probabilistic models that represent temporal relations between a set of random variables. We identify a set of control variables that influence the sensor responses, create a graphical representation that captures the causal relations between these variables, and finally train the model with experimental data. We validated the approach on experimental data in terms of predictive accuracy and classification performance. Our results show that DBNs can accurately predict the dynamic response of MOX sensors, as well as capture the discriminatory information present in the sensor transients. |
2010
|
Choi, J; Ahmed, B; Gutierrez-Osuna, R Ambulatory Stress Monitoring with Minimally-Invasive Wearable Sensors Technical Report 2010. @techreport{choi10techreport,
title = {Ambulatory Stress Monitoring with Minimally-Invasive Wearable Sensors},
author = {J Choi and B Ahmed and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/choi2010techreport.pdf},
year = {2010},
date = {2010-11-10},
abstract = {Chronic stress can have serious health consequences, and is a leading risk factor for heart diseases, diabetes, asthma and depression. This article presents a minimally-invasive and wireless wearable sensor platform that can be used to monitor a number of physiological variables known to correlate with stress. We discuss the system design and sensor selection, both of which were guided as a tradeoff between information content and wearability. The platform is thoroughly evaluated through a battery of tests that elicit mental workload and physical activity, as well as through subjective assessments of comfort. Our results indicate that the sensor system is responsive to three broad types of factors: mental workload, posture and physical activity. We also describe a system-identification method that improves detection of mental stress by removing respiratory influences on heart rate.},
keywords = {Electrodermal activity, Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {techreport}
}
Chronic stress can have serious health consequences, and is a leading risk factor for heart diseases, diabetes, asthma and depression. This article presents a minimally-invasive and wireless wearable sensor platform that can be used to monitor a number of physiological variables known to correlate with stress. We discuss the system design and sensor selection, both of which were guided as a tradeoff between information content and wearability. The platform is thoroughly evaluated through a battery of tests that elicit mental workload and physical activity, as well as through subjective assessments of comfort. Our results indicate that the sensor system is responsive to three broad types of factors: mental workload, posture and physical activity. We also describe a system-identification method that improves detection of mental stress by removing respiratory influences on heart rate. |
Felps, D; Gutierrez-Osuna, R Normalization of Articulatory Data through Procrustes Transformations and Analysis-by-synthesis Technical Report 2010. @techreport{felps2010techreport,
title = {Normalization of Articulatory Data through Procrustes Transformations and Analysis-by-synthesis},
author = {D Felps and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/felps2010techreport.pdf},
year = {2010},
date = {2010-05-05},
abstract = {We describe and compare three methods that can be used to normalize articulatory data across speakers. The methods seek to explain systematic anatomical differences between a source and target speaker without modifying the articulatory velocities of the source speaker. The first method is the classical Procrustes transform, which allows for a global translation, rotation, and scaling of articulator positions. An extension to the Procrustes transform is presented that allows independent translations of each articulator. The additional parameters provide a 35% increase in articulatory similarity between two speakers when compared to classical Procrustes. The proposed extension is also coupled with a data-driven articulatory synthesizer to select model parameters that best explain the predicted acoustic (rather than articulatory) differences.},
keywords = {Articulatory synthesis, Speech},
pubstate = {published},
tppubtype = {techreport}
}
We describe and compare three methods that can be used to normalize articulatory data across speakers. The methods seek to explain systematic anatomical differences between a source and target speaker without modifying the articulatory velocities of the source speaker. The first method is the classical Procrustes transform, which allows for a global translation, rotation, and scaling of articulator positions. An extension to the Procrustes transform is presented that allows independent translations of each articulator. The additional parameters provide a 35% increase in articulatory similarity between two speakers when compared to classical Procrustes. The proposed extension is also coupled with a data-driven articulatory synthesizer to select model parameters that best explain the predicted acoustic (rather than articulatory) differences. |
Gutierrez-Osuna, R; Felps, D Foreign Accent Conversion through Voice Morphing Technical Report 2010. @techreport{gutierrez2010techreport,
title = {Foreign Accent Conversion through Voice Morphing},
author = {R Gutierrez-Osuna and D Felps},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2010techreport.pdf},
year = {2010},
date = {2010-05-05},
abstract = {We present a voice morphing strategy that can be used to generate a continuum of accent transformations between a foreign speaker and a native speaker. The approach performs a cepstral decomposition of speech into spectral slope and spectral detail. Accent conversions are then generated by combining the spectral slope of the foreign speaker with a morph of the spectral detail of the native speaker. Spectral morphing is achieved by representing the spectral detail through pulse density modulation and averaging pulses in a pair-wise fashion. The technique is evaluated on parallel recordings from two ARCTIC speakers using objective measures of acoustic quality, speaker identity and foreign accent hat have been recently shown to correlate with perceptual results from listening tests.},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {techreport}
}
We present a voice morphing strategy that can be used to generate a continuum of accent transformations between a foreign speaker and a native speaker. The approach performs a cepstral decomposition of speech into spectral slope and spectral detail. Accent conversions are then generated by combining the spectral slope of the foreign speaker with a morph of the spectral detail of the native speaker. Spectral morphing is achieved by representing the spectral detail through pulse density modulation and averaging pulses in a pair-wise fashion. The technique is evaluated on parallel recordings from two ARCTIC speakers using objective measures of acoustic quality, speaker identity and foreign accent hat have been recently shown to correlate with perceptual results from listening tests. |
Yu, N Y; Yamauchi, T; Yang, H F; Chen, Y L; Gutierrez-Osuna, R Feature selection for inductive generalization Journal Article In: Cognitive science, vol. 34, no. 8, pp. 1574–1593, 2010. @article{yu2010cogsci,
title = {Feature selection for inductive generalization},
author = {N Y Yu and T Yamauchi and H F Yang and Y L Chen and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/yu2010cogsci.pdf},
year = {2010},
date = {2010-01-01},
journal = {Cognitive science},
volume = {34},
number = {8},
pages = {1574--1593},
publisher = {Wiley Online Library},
abstract = {Judging similarities among objects, events, and experiences is one of the most basic cognitive abilities, allowing us to make predictions and generalizations. The main assumption in similarity judgment is that people selectively attend to salient features of stimuli and judge their similarities on the basis of the common and distinct features of the stimuli. However, it is unclear how people select features from stimuli and how they weigh features. Here, we present a computational method that helps address these questions. Our procedure combines image-processing techniques with a machine-learning algorithm and assesses feature weights that can account for both similarity and categorization judgment data. Our analysis suggests that a small number of local features are particularly important to explain our behavioral data.},
keywords = {Face perception},
pubstate = {published},
tppubtype = {article}
}
Judging similarities among objects, events, and experiences is one of the most basic cognitive abilities, allowing us to make predictions and generalizations. The main assumption in similarity judgment is that people selectively attend to salient features of stimuli and judge their similarities on the basis of the common and distinct features of the stimuli. However, it is unclear how people select features from stimuli and how they weigh features. Here, we present a computational method that helps address these questions. Our procedure combines image-processing techniques with a machine-learning algorithm and assesses feature weights that can account for both similarity and categorization judgment data. Our analysis suggests that a small number of local features are particularly important to explain our behavioral data. |
Gosangi, R; Gutierrez-Osuna, R Energy-aware active chemical sensing Conference Proceedings of IEEE Sensors, IEEE 2010. @conference{gosangi2010sensorsc,
title = {Energy-aware active chemical sensing},
author = {R Gosangi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gosangi2010sensorsc.pdf},
year = {2010},
date = {2010-01-01},
booktitle = {Proceedings of IEEE Sensors},
pages = {1094--1099},
organization = {IEEE},
abstract = {We propose an adaptive sensing framework for metal-oxide (MOX) sensors that seeks to minimize energy consumption through temperature modulation. Our approach generates temperature programs by means of an active-sensing strategy combined with an objective function that penalizes power consumption. The problem is modeled as a partially observable Markov decision process (POMDP) and solved with a myopic policy that operates in real time. The policy selects sensing actions (i.e., temperature pulses) that balance misclassification costs (e.g., chemicals identified as the wrong target) and sensing costs (i.e., power consumption). We experimentally validate the method on a ternary chemical discrimination problem, and compare it against a "passive classifier." Our results show that, for a given energy budget, the active-sensing strategy selects temperatures with more discriminatory information than those of the passive classifier by penalizing pulses of higher temperature and longer durations.},
keywords = {Active sensing, Chemical sensors, Metal-oxide sensors, Temperature modulation},
pubstate = {published},
tppubtype = {conference}
}
We propose an adaptive sensing framework for metal-oxide (MOX) sensors that seeks to minimize energy consumption through temperature modulation. Our approach generates temperature programs by means of an active-sensing strategy combined with an objective function that penalizes power consumption. The problem is modeled as a partially observable Markov decision process (POMDP) and solved with a myopic policy that operates in real time. The policy selects sensing actions (i.e., temperature pulses) that balance misclassification costs (e.g., chemicals identified as the wrong target) and sensing costs (i.e., power consumption). We experimentally validate the method on a ternary chemical discrimination problem, and compare it against a "passive classifier." Our results show that, for a given energy budget, the active-sensing strategy selects temperatures with more discriminatory information than those of the passive classifier by penalizing pulses of higher temperature and longer durations. |
Choi, J; Gutierrez-Osuna, R Estimating mental stress using a wearable cardio-respiratory sensor Conference Proceedings of IEEE Sensors, IEEE 2010. @conference{choi2010sensorsc,
title = {Estimating mental stress using a wearable cardio-respiratory sensor},
author = {J Choi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/choi2010sensorsc.pdf},
year = {2010},
date = {2010-01-01},
booktitle = {Proceedings of IEEE Sensors},
pages = {150--154},
organization = {IEEE},
abstract = {This article describes a signal-processing approach to detect mental stress using unobtrusive wearable sensors. The approach addresses a major weakness of traditional methods based on heart-rate-variability (HRV) analysis: sensitivity to respiratory influences. To address this issue, we build a linear model that predicts the effect of breathing on the autonomic nervous system activation, as measured through HRV. Subtraction of respiratory effects leads to a residual signal that provides better discrimination between mental stress and relaxation conditions than traditional HRV tachogram. The method is experimentally validated on a discrimination task with two psycho-physiological conditions: mental stress and relaxation. To illustrate the effectiveness of the method, we impose a pacing respiratory signal that interferes with the main spectral band of the sympathetic branch. Our results suggest that the HRV residual signal has more discrimination power than conventional HRV analysis in the presence of respiration interferences.},
keywords = {Health, Heart rate variability, Stress, Wearable sensors},
pubstate = {published},
tppubtype = {conference}
}
This article describes a signal-processing approach to detect mental stress using unobtrusive wearable sensors. The approach addresses a major weakness of traditional methods based on heart-rate-variability (HRV) analysis: sensitivity to respiratory influences. To address this issue, we build a linear model that predicts the effect of breathing on the autonomic nervous system activation, as measured through HRV. Subtraction of respiratory effects leads to a residual signal that provides better discrimination between mental stress and relaxation conditions than traditional HRV tachogram. The method is experimentally validated on a discrimination task with two psycho-physiological conditions: mental stress and relaxation. To illustrate the effectiveness of the method, we impose a pacing respiratory signal that interferes with the main spectral band of the sympathetic branch. Our results suggest that the HRV residual signal has more discrimination power than conventional HRV analysis in the presence of respiration interferences. |
Gutierrez-Osuna, R; Hierlemann, A Adaptive Microsensor Systems Journal Article In: Annual Review of Analytical Chemistry, vol. 3, pp. 255–276, 2010. @article{gutierrez2010arac,
title = {Adaptive Microsensor Systems},
author = {R Gutierrez-Osuna and A Hierlemann},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2010arac.pdf},
year = {2010},
date = {2010-01-01},
journal = {Annual Review of Analytical Chemistry},
volume = {3},
pages = {255--276},
publisher = {Annual Reviews},
abstract = {We provide a broad review of approaches for developing chemosensor systems whose operating parameters can adapt in response to environmental changes or application needs. Adaptation may take place at the instrumentation level (e.g., tunable sensors) and at the data-analysis level (e.g., adaptive classifiers). We discuss several strategies that provide tunability at the device level: modulation of internal sensing parameters, such as frequencies and operation voltages; variation of external parameters, such as exposure times and catalysts; and development of compact microanalysis systems with multiple tuning options. At the data-analysis level, we consider adaptive filters for change, interference, and drift rejection; pattern classifiers that can adapt to changes in the statistical properties of training data; and active-sensing techniques that can tune sensing parameters in real time. We conclude with a discussion of future opportunities for adaptive sensing in wireless distributed sensor systems.},
keywords = {Active sensing, Chemical sensors},
pubstate = {published},
tppubtype = {article}
}
We provide a broad review of approaches for developing chemosensor systems whose operating parameters can adapt in response to environmental changes or application needs. Adaptation may take place at the instrumentation level (e.g., tunable sensors) and at the data-analysis level (e.g., adaptive classifiers). We discuss several strategies that provide tunability at the device level: modulation of internal sensing parameters, such as frequencies and operation voltages; variation of external parameters, such as exposure times and catalysts; and development of compact microanalysis systems with multiple tuning options. At the data-analysis level, we consider adaptive filters for change, interference, and drift rejection; pattern classifiers that can adapt to changes in the statistical properties of training data; and active-sensing techniques that can tune sensing parameters in real time. We conclude with a discussion of future opportunities for adaptive sensing in wireless distributed sensor systems. |
Felps, D; Gutierrez-Osuna, R Developing objective measures of foreign-accent conversion Journal Article In: Audio, Speech, and Language Processing, IEEE Transactions on, vol. 18, no. 5, pp. 1030–1040, 2010. @article{felps2010talsp,
title = {Developing objective measures of foreign-accent conversion},
author = {D Felps and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/felps2010talsp.pdf},
year = {2010},
date = {2010-01-01},
journal = {Audio, Speech, and Language Processing, IEEE Transactions on},
volume = {18},
number = {5},
pages = {1030--1040},
publisher = {IEEE},
abstract = {Various methods have recently appeared to transform foreign-accented speech into its native-accented counterpart. Evaluation of these accent conversion methods requires extensive listening tests across a number of perceptual dimensions. This article presents three objective measures that may be used to assess the acoustic quality, degree of foreign accent, and speaker identity of accent-converted utterances. Accent conversion generates novel utterances: those of a foreign speaker with a native accent. Therefore, the acoustic quality in accent conversion cannot be evaluated with conventional measures of spectral distortion, which assume that a clean recording of the speech signal is available for comparison. Here we evaluate a single-ended measure of speech quality, lTV -T recommendation P.563 for narrow-band telephony. We also propose a measure of foreign accent that exploits a weakness of automatic speech recognizers: their sensitivity to foreign accents. Namely, we use phoneme-level match scores given by the HTK recognizer trained on a large number of English American speakers to obtain a measure of native accent. Finally, we propose a measure of speaker identity that projects acoustic vectors (e.g., Mel cepstral, F0) onto the linear discriminant that maximizes separability for a given pair of source and target speakers. The three measures are evaluated on a corpus of accent-converted utterances that had been previously rated through perceptual tests. Our results show that the three measures have a high degree of correlation with their corresponding subjective ratings, suggesting that they may be used to accelerate the development of foreign-accent conversion tools. Applications of these measures in the context of computer assisted pronunciation training and voice conversion are also discussed.},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {article}
}
Various methods have recently appeared to transform foreign-accented speech into its native-accented counterpart. Evaluation of these accent conversion methods requires extensive listening tests across a number of perceptual dimensions. This article presents three objective measures that may be used to assess the acoustic quality, degree of foreign accent, and speaker identity of accent-converted utterances. Accent conversion generates novel utterances: those of a foreign speaker with a native accent. Therefore, the acoustic quality in accent conversion cannot be evaluated with conventional measures of spectral distortion, which assume that a clean recording of the speech signal is available for comparison. Here we evaluate a single-ended measure of speech quality, lTV -T recommendation P.563 for narrow-band telephony. We also propose a measure of foreign accent that exploits a weakness of automatic speech recognizers: their sensitivity to foreign accents. Namely, we use phoneme-level match scores given by the HTK recognizer trained on a large number of English American speakers to obtain a measure of native accent. Finally, we propose a measure of speaker identity that projects acoustic vectors (e.g., Mel cepstral, F0) onto the linear discriminant that maximizes separability for a given pair of source and target speakers. The three measures are evaluated on a corpus of accent-converted utterances that had been previously rated through perceptual tests. Our results show that the three measures have a high degree of correlation with their corresponding subjective ratings, suggesting that they may be used to accelerate the development of foreign-accent conversion tools. Applications of these measures in the context of computer assisted pronunciation training and voice conversion are also discussed. |
Gosangi, R; Gutierrez-Osuna, R Active temperature programming for metal-oxide chemoresistors Journal Article In: Sensors Journal, IEEE, vol. 10, no. 6, pp. 1075–1082, 2010. @article{gosangi2010sj,
title = {Active temperature programming for metal-oxide chemoresistors},
author = {R Gosangi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gosangi2010sj-1.pdf},
year = {2010},
date = {2010-01-01},
journal = {Sensors Journal, IEEE},
volume = {10},
number = {6},
pages = {1075--1082},
publisher = {IEEE},
abstract = {Modulating the operating temperature of metal-oxide (MOX) chemical sensors gives rise to gas-specific signatures that
provide a wealth of analytical information. In most cases, the operating temperature is modulated according to a standard waveform (e.g., ramp, sine wave). A few studies have approached the optimization of temperature profiles systematically, but these optimizations are performed offline and cannot adapt to changes in the environment. Here, we present an “active perception” strategy based on Partially Observable Markov Decision Processes (POMDP) that allows the temperature program to be optimized in real time, as the sensor reacts to its environment. We characterize the method on a ternary classification problem using a simulated sensor model subjected to additive Gaussian noise, and compare it against two “passive” approaches, a naïve Bayes classifier and a nearest neighbor classifier. Finally, we validate the method in real time using a Taguchi sensor exposed to three volatile compounds. Our results show that the POMDP outperforms both passive approaches and provides a strategy to balance classification performance and sensing costs.},
keywords = {Active sensing, Chemical sensors, Metal-oxide sensors, Temperature modulation},
pubstate = {published},
tppubtype = {article}
}
Modulating the operating temperature of metal-oxide (MOX) chemical sensors gives rise to gas-specific signatures that
provide a wealth of analytical information. In most cases, the operating temperature is modulated according to a standard waveform (e.g., ramp, sine wave). A few studies have approached the optimization of temperature profiles systematically, but these optimizations are performed offline and cannot adapt to changes in the environment. Here, we present an “active perception” strategy based on Partially Observable Markov Decision Processes (POMDP) that allows the temperature program to be optimized in real time, as the sensor reacts to its environment. We characterize the method on a ternary classification problem using a simulated sensor model subjected to additive Gaussian noise, and compare it against two “passive” approaches, a naïve Bayes classifier and a nearest neighbor classifier. Finally, we validate the method in real time using a Taguchi sensor exposed to three volatile compounds. Our results show that the POMDP outperforms both passive approaches and provides a strategy to balance classification performance and sensing costs. |
Felps, D; Geng, C; Berger, M; Richmond, K; Gutierrez-Osuna, R Relying on critical articulators to estimate vocal tract spectra in an articulatory-acoustic database Conference Interspeech, 2010. @conference{felps2010interspeech,
title = {Relying on critical articulators to estimate vocal tract spectra in an articulatory-acoustic database},
author = {D Felps and C Geng and M Berger and K Richmond and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/felps2010interspeech.pdf},
year = {2010},
date = {2010-01-01},
booktitle = {Interspeech},
abstract = {We present a new phone-dependent feature weighting scheme that can be used to map articulatory configurations (e.g. EMA) onto vocal tract spectra (e.g. MFCC) through table lookup. The approach consists of assigning feature weights according to a feature's ability to predict the acoustic distance between frames. Since an articulator's predictive accuracy is phonedependent (e.g., lip location is a better predictor for bilabial sounds than for palatal sounds), a unique weight vector is found for each phone. Inspection of the weights reveals a correspondence with the expected critical articulators for many phones. The proposed method reduces overall cepstral error by 6% when compared to a uniform weighting scheme. Vowels show the greatest benefit, though improvements occur for 80% of the tested phones.},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {conference}
}
We present a new phone-dependent feature weighting scheme that can be used to map articulatory configurations (e.g. EMA) onto vocal tract spectra (e.g. MFCC) through table lookup. The approach consists of assigning feature weights according to a feature's ability to predict the acoustic distance between frames. Since an articulator's predictive accuracy is phonedependent (e.g., lip location is a better predictor for bilabial sounds than for palatal sounds), a unique weight vector is found for each phone. Inspection of the weights reveals a correspondence with the expected critical articulators for many phones. The proposed method reduces overall cepstral error by 6% when compared to a uniform weighting scheme. Vowels show the greatest benefit, though improvements occur for 80% of the tested phones. |
Gutierrez-Osuna, R Electronic Nose Book Chapter In: SAGE Encyclopedia of Perception, Sage Publications, 2010. @inbook{gutierrez2010chapter,
title = {Electronic Nose},
author = {R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2010chapter.pdf},
year = {2010},
date = {2010-01-01},
booktitle = {SAGE Encyclopedia of Perception},
publisher = {Sage Publications},
abstract = {Across a wide range of applications there is a need to rapidly detect, identify, and quantify complex volatile mixtures. Food manufacturers need to monitor the quality of incoming raw products and evaluate the perceptual properties of their products; environmental agencies seek to regulate the emission of malodors from waste treatment and other industrial plants. Humans readily accomplish these tasks through the sense of smell. Could an instrument be developed to mimic these capabilities? This entry
describes the technology of electronic noses, discusses the challenges associated with mimicking human olfaction, and reviews past and current application areas of electronic noses. },
keywords = {Electronic nose},
pubstate = {published},
tppubtype = {inbook}
}
Across a wide range of applications there is a need to rapidly detect, identify, and quantify complex volatile mixtures. Food manufacturers need to monitor the quality of incoming raw products and evaluate the perceptual properties of their products; environmental agencies seek to regulate the emission of malodors from waste treatment and other industrial plants. Humans readily accomplish these tasks through the sense of smell. Could an instrument be developed to mimic these capabilities? This entry
describes the technology of electronic noses, discusses the challenges associated with mimicking human olfaction, and reviews past and current application areas of electronic noses. |
2009
|
Felps, D; Bortfeld, H; Gutierrez-Osuna, R Foreign accent conversion in computer assisted pronunciation training Journal Article In: Speech communication, vol. 51, no. 10, pp. 920–932, 2009. @article{felps2009foreign,
title = {Foreign accent conversion in computer assisted pronunciation training},
author = {D Felps and H Bortfeld and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/felps2009foreign.pdf},
year = {2009},
date = {2009-01-01},
journal = {Speech communication},
volume = {51},
number = {10},
pages = {920--932},
publisher = {Elsevier},
abstract = {Learners of a second language practice their pronunciation by listening to and imitating utterances from native speakers. Recent research has shown that choosing a well-matched native speaker to imitate can have a positive impact on pronunciation training. Here we propose a voice-transformation technique that can be used to generate the (arguably) ideal voice to imitate: the own voice of the learner with a native accent. Our work extends previous research, which suggests that providing learners with prosodically corrected versions of their utterances can be a suitable form of feedback in computer assisted pronunciation training. Our technique provides a conversion of both prosodic and segmental characteristics by means of a pitch-synchronous decomposition of speech into glottal excitation and spectral envelope. We apply the technique to a corpus containing parallel recordings of foreign-accented and native-accented utterances, and validate the resulting accent conversions through a series of perceptual experiments. Our results indicate that the technique can reduce foreign accentedness without significantly altering the voice quality properties of the foreign speaker. Finally, we propose a pedagogical strategy for integrating accent conversion as a form of behavioral shaping in computer assisted pronunciation training.},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {article}
}
Learners of a second language practice their pronunciation by listening to and imitating utterances from native speakers. Recent research has shown that choosing a well-matched native speaker to imitate can have a positive impact on pronunciation training. Here we propose a voice-transformation technique that can be used to generate the (arguably) ideal voice to imitate: the own voice of the learner with a native accent. Our work extends previous research, which suggests that providing learners with prosodically corrected versions of their utterances can be a suitable form of feedback in computer assisted pronunciation training. Our technique provides a conversion of both prosodic and segmental characteristics by means of a pitch-synchronous decomposition of speech into glottal excitation and spectral envelope. We apply the technique to a corpus containing parallel recordings of foreign-accented and native-accented utterances, and validate the resulting accent conversions through a series of perceptual experiments. Our results indicate that the technique can reduce foreign accentedness without significantly altering the voice quality properties of the foreign speaker. Finally, we propose a pedagogical strategy for integrating accent conversion as a form of behavioral shaping in computer assisted pronunciation training. |
Rodriguez, J; Bortfeld, H; Rudomin, I; Hernandez, B; Gutierrez-Osuna, R The reverse-caricature effect revisited: Familiarization with frontal facial caricatures improves veridical face recognition Journal Article In: Applied cognitive psychology, vol. 23, no. 5, pp. 733–742, 2009. @article{rodriguez2009reverse,
title = {The reverse-caricature effect revisited: Familiarization with frontal facial caricatures improves veridical face recognition},
author = {J Rodriguez and H Bortfeld and I Rudomin and B Hernandez and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/rodriguez2009reverse.pdf},
year = {2009},
date = {2009-01-01},
journal = {Applied cognitive psychology},
volume = {23},
number = {5},
pages = {733--742},
publisher = {Wiley Online Library},
abstract = {Prior research suggests that recognition of a person's face can be facilitated by exaggerating the distinctive features of the face during training. We tested if this ‘reverse-caricature effect’ would be robust to procedural variations that created more difficult learning environments. Specifically, we examined whether the effect would emerge with frontal rather than three-quarter views, after very brief exposure to caricatures during the learning phase and after modest rotations of faces during the recognition phase. Results indicate that, even under these difficult training conditions, people are more accurate at recognizing unaltered faces if they are first familiarized with caricatures of the faces, rather than with the unaltered faces. These findings support the development of new training methods to improve face recognition.},
keywords = {Face perception},
pubstate = {published},
tppubtype = {article}
}
Prior research suggests that recognition of a person's face can be facilitated by exaggerating the distinctive features of the face during training. We tested if this ‘reverse-caricature effect’ would be robust to procedural variations that created more difficult learning environments. Specifically, we examined whether the effect would emerge with frontal rather than three-quarter views, after very brief exposure to caricatures during the learning phase and after modest rotations of faces during the recognition phase. Results indicate that, even under these difficult training conditions, people are more accurate at recognizing unaltered faces if they are first familiarized with caricatures of the faces, rather than with the unaltered faces. These findings support the development of new training methods to improve face recognition. |
Choi, J; Gutierrez-Osuna, R Using heart rate monitors to detect mental stress Conference Sixth International Workshop on Wearable and Implantable Body Sensor Networks, IEEE 2009. @conference{choi2009using,
title = {Using heart rate monitors to detect mental stress},
author = {J Choi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/choi2009using.pdf},
year = {2009},
date = {2009-01-01},
booktitle = {Sixth International Workshop on Wearable and Implantable Body Sensor Networks},
pages = {219--223},
organization = {IEEE},
abstract = {This article describes an approach to detecting mental stress using unobtrusive wearable sensors. The approach relies on estimating the state of the autonomic nervous system from an analysis of heart rate variability. Namely, we use a non-linear system identification technique known as principal dynamic modes (PDM) to predict the activation level of the two autonomic branches: sympathetic (i.e. stress-inducing) and parasympathetic (i.e. relaxation-related). We validate the method on a discrimination problem with two psychophysiological conditions, one associated with mental tasks and one induced by relaxation exercises. Our results indicate that PDM features are more stable and less subject-dependent than spectral features, though the latter provide higher classification performance within subjects. When PDM and spectral features are combined, our system discriminates stressful events with a success rate of 83% within subjects (69% between subjects).},
keywords = {Stress, Wearable sensors},
pubstate = {published},
tppubtype = {conference}
}
This article describes an approach to detecting mental stress using unobtrusive wearable sensors. The approach relies on estimating the state of the autonomic nervous system from an analysis of heart rate variability. Namely, we use a non-linear system identification technique known as principal dynamic modes (PDM) to predict the activation level of the two autonomic branches: sympathetic (i.e. stress-inducing) and parasympathetic (i.e. relaxation-related). We validate the method on a discrimination problem with two psychophysiological conditions, one associated with mental tasks and one induced by relaxation exercises. Our results indicate that PDM features are more stable and less subject-dependent than spectral features, though the latter provide higher classification performance within subjects. When PDM and spectral features are combined, our system discriminates stressful events with a success rate of 83% within subjects (69% between subjects). |
Gosangi, R; Gutierrez-Osuna, R Active chemical sensing with partially observable Markov decision processes Conference Proceedings of 13th International Symposium on Olfaction and Electronic Noses, 2009. @conference{gosangi2009active,
title = {Active chemical sensing with partially observable Markov decision processes},
author = {R Gosangi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gosangi2009active.pdf},
year = {2009},
date = {2009-01-01},
booktitle = {Proceedings of 13th International Symposium on Olfaction and Electronic Noses},
abstract = {We present an active‐perception strategy to optimize the temperature program of metal‐oxide sensors in real time, as the sensor reacts with its environment. We model the problem as a partially observable Markov decision process (POMDP), where actions correspond to measurements at particular temperatures, and the agent is to find a temperature sequence that minimizes the Bayes risk. We validate the method on a binary classification problem with a simulated sensor. Our results show that the method provides a balance between classification rate and sensing costs.},
keywords = {Active sensing},
pubstate = {published},
tppubtype = {conference}
}
We present an active‐perception strategy to optimize the temperature program of metal‐oxide sensors in real time, as the sensor reacts with its environment. We model the problem as a partially observable Markov decision process (POMDP), where actions correspond to measurements at particular temperatures, and the agent is to find a temperature sequence that minimizes the Bayes risk. We validate the method on a binary classification problem with a simulated sensor. Our results show that the method provides a balance between classification rate and sensing costs. |
Pazarloglou, A; George, S; Stoleru, R; Gutierrez-Osuna, R Demo abstract: Signal reconstruction with subnyquist sampling using wireless sensor networks Conference International Conference on Information Processing in Sensor Networks, IEEE 2009. @conference{pazarloglou2009demo,
title = {Demo abstract: Signal reconstruction with subnyquist sampling using wireless sensor networks},
author = {A Pazarloglou and S George and R Stoleru and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/pazarloglou2009demo.pdf},
year = {2009},
date = {2009-01-01},
booktitle = {International Conference on Information Processing in Sensor Networks},
pages = {423--424},
organization = {IEEE},
abstract = {Data streaming for sensor networks is an emerging class of application that can offer significant safety and utility enhancements in a number of critical environments. In one such application, disaster response, a wireless sensor network may assist in the detection of living victims trapped in collapsed buildings. As a step towards this goal, this paper addresses the very high bandwidth and processing requirements posed by streaming applications, and demonstrates a sub-Nyquist sampling procedure for reconstructing higher-resolution speech signals.},
keywords = {Other},
pubstate = {published},
tppubtype = {conference}
}
Data streaming for sensor networks is an emerging class of application that can offer significant safety and utility enhancements in a number of critical environments. In one such application, disaster response, a wireless sensor network may assist in the detection of living victims trapped in collapsed buildings. As a step towards this goal, this paper addresses the very high bandwidth and processing requirements posed by streaming applications, and demonstrates a sub-Nyquist sampling procedure for reconstructing higher-resolution speech signals. |
Pazarloglou, A; Stoleru, R; Gutierrez-Osuna, R High-resolution speech signal reconstruction in wireless sensor networks Conference Consumer Communications and Networking Conference, IEEE 2009. @conference{pazarloglou2009high,
title = {High-resolution speech signal reconstruction in wireless sensor networks},
author = {A Pazarloglou and R Stoleru and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/pazarloglou2009high.pdf},
year = {2009},
date = {2009-01-01},
booktitle = {Consumer Communications and Networking Conference},
pages = {1--5},
organization = {IEEE},
abstract = {Data streaming is an emerging class of applications for sensor networks that has very high bandwidth and processing power requirements. In this paper, a new approach for speech data streaming is proposed, which is based on a distributed scheme. This scheme focuses on balancing the energy consumption among nodes in a sensor network by allowing low- resolution streams from multiple nodes to be fused at a central processing node in order to produce an enhanced resolution speech signal. Simulations and experimental results with real microphone signals are presented.},
keywords = {Speech},
pubstate = {published},
tppubtype = {conference}
}
Data streaming is an emerging class of applications for sensor networks that has very high bandwidth and processing power requirements. In this paper, a new approach for speech data streaming is proposed, which is based on a distributed scheme. This scheme focuses on balancing the energy consumption among nodes in a sensor network by allowing low- resolution streams from multiple nodes to be fused at a central processing node in order to produce an enhanced resolution speech signal. Simulations and experimental results with real microphone signals are presented. |
Raman, B; Gutierrez-Osuna, R Relating sensor responses of odorants to their organoleptic properties by means of a biologically-inspired model of receptor neuron convergence onto olfactory bulb Book Chapter In: Biologically inspired signal processing for chemical sensing, pp. 93–108, Springer Berlin/Heidelberg, 2009. @inbook{raman2009relating,
title = {Relating sensor responses of odorants to their organoleptic properties by means of a biologically-inspired model of receptor neuron convergence onto olfactory bulb},
author = {B Raman and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/raman2009relating.pdf},
year = {2009},
date = {2009-01-01},
booktitle = {Biologically inspired signal processing for chemical sensing},
pages = {93--108},
publisher = {Springer Berlin/Heidelberg},
abstract = {This volume presents a collection of research advances in biologically inspired signal processing for chemical sensing. The olfactory system, and the gustatory system to a minor extent, has been taken in the last decades as a source of inspiration to develop artificial sensing systems. The performance of this biological system outperforms in many aspects that of their artificial counterpart. Thus, the goal of researchers in this field is to understand and capture those features that make the olfactory system especially suited for the processing of chemical information. The recognition of odors by the olfactory system entails a number of signal processing functions such as preprocessing, dimensionality reduction, contrast enhancement, and classification. Using mathematical models to mimic the architecture of the olfactory system, these processing functions can be applied to chemical sensor signals. This book provides some background on the olfactory system including a review on information processing in the insect olfactory system along with a proposed signal processing architecture based on the mammalian cortex. It also provides some bio-inspired approaches to process chemical sensor signals such as an olfactory mucosa to improve odor separation and a model of olfactory receptor neuron convergence to correlate sensor responses to an odor and his organoleptic properties.},
keywords = {Neuromorphic models},
pubstate = {published},
tppubtype = {inbook}
}
This volume presents a collection of research advances in biologically inspired signal processing for chemical sensing. The olfactory system, and the gustatory system to a minor extent, has been taken in the last decades as a source of inspiration to develop artificial sensing systems. The performance of this biological system outperforms in many aspects that of their artificial counterpart. Thus, the goal of researchers in this field is to understand and capture those features that make the olfactory system especially suited for the processing of chemical information. The recognition of odors by the olfactory system entails a number of signal processing functions such as preprocessing, dimensionality reduction, contrast enhancement, and classification. Using mathematical models to mimic the architecture of the olfactory system, these processing functions can be applied to chemical sensor signals. This book provides some background on the olfactory system including a review on information processing in the insect olfactory system along with a proposed signal processing architecture based on the mammalian cortex. It also provides some bio-inspired approaches to process chemical sensor signals such as an olfactory mucosa to improve odor separation and a model of olfactory receptor neuron convergence to correlate sensor responses to an odor and his organoleptic properties. |
Yu, N Y; Yamauchi, T; Gutierrez-Osuna, R Similarity perception of visual objects: A machine-learning approach Conference Proceedings of International Conference on Asia Pacific Psychology, 2009. @conference{yu2009similarity,
title = {Similarity perception of visual objects: A machine-learning approach},
author = {N Y Yu and T Yamauchi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/yu2009similarity.pdf},
year = {2009},
date = {2009-01-01},
booktitle = {Proceedings of International Conference on Asia Pacific Psychology},
keywords = {Face perception},
pubstate = {published},
tppubtype = {conference}
}
|
2008
|
Yamanaka, T; Gutierrez-Osuna, R Extracting functional clusters of glomeruli in rat olfactory bulb by non-negative matrix factorization Technical Report 2008. @techreport{yamanaka08extracting,
title = {Extracting functional clusters of glomeruli in rat olfactory bulb by non-negative matrix factorization},
author = {T Yamanaka and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/yamanaka08extracting.pdf},
year = {2008},
date = {2008-11-17},
abstract = {Ensemble coding in the early olfactory pathway has been extensively investigated using imaging techniques. These studies have shown that glomeruli with similar affinity gather in close proximity in olfactory bulb, forming a module. In this work, we propose computational methods for analyzing this neural code. Specifically, we show how non-negative matrix factorization (NMF), a machine-learning method for extracting the intrinsic parts of objects, can be used to automatically extract glomerular modules from a database of bulbar activity patterns, as measured with 2-deoxyglucose. The modules extracted by NMF correspond to localized areas in olfactory bulb, in consistency with experimental results from imaging studies on glomerular activity. To validate the emerging representation, we analyzed the relationship between neural activity on these modules and perceptual descriptions of the odorants. We first used pattern-classification techniques to predict ten perceptual descriptors for 53 odorants from their activity on the modules. Our results indicate that NMF is able to extract modules that are intrinsic to the odor coding mechanism. Furthermore, we used mutual information to analyze the relationship between modules and olfactory perception. This analysis revealed the contribution of each module to the olfactory percepts.},
keywords = {Olfaction},
pubstate = {published},
tppubtype = {techreport}
}
Ensemble coding in the early olfactory pathway has been extensively investigated using imaging techniques. These studies have shown that glomeruli with similar affinity gather in close proximity in olfactory bulb, forming a module. In this work, we propose computational methods for analyzing this neural code. Specifically, we show how non-negative matrix factorization (NMF), a machine-learning method for extracting the intrinsic parts of objects, can be used to automatically extract glomerular modules from a database of bulbar activity patterns, as measured with 2-deoxyglucose. The modules extracted by NMF correspond to localized areas in olfactory bulb, in consistency with experimental results from imaging studies on glomerular activity. To validate the emerging representation, we analyzed the relationship between neural activity on these modules and perceptual descriptions of the odorants. We first used pattern-classification techniques to predict ten perceptual descriptors for 53 odorants from their activity on the modules. Our results indicate that NMF is able to extract modules that are intrinsic to the odor coding mechanism. Furthermore, we used mutual information to analyze the relationship between modules and olfactory perception. This analysis revealed the contribution of each module to the olfactory percepts. |
Yamanaka, T; Perera-Lluna, A; Raman, B; Gutierrez-Galvez, A; Gutierrez-Osuna, R Learning Sparse Basis Vectors in Small-Sample Datasets through Regularized Non-Negative Matrix Factorization Technical Report 2008. @techreport{yamanaka08learning,
title = {Learning Sparse Basis Vectors in Small-Sample Datasets through Regularized Non-Negative Matrix Factorization},
author = {T Yamanaka and A Perera-Lluna and B Raman and A Gutierrez-Galvez and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/yamanaka08learning.pdf},
year = {2008},
date = {2008-07-16},
abstract = {This article presents a novel dimensionality-reduction technique, Regularized Non-negative Matrix Factorization (RNMF), which combines the non-negativity constraint of NMF with a regularization term. In contrast with NMF, which degrades to holistic representations with decreasing amount of data, RNMF is able to extract parts of objects even in the small-sample case.},
keywords = {Face perception},
pubstate = {published},
tppubtype = {techreport}
}
This article presents a novel dimensionality-reduction technique, Regularized Non-negative Matrix Factorization (RNMF), which combines the non-negativity constraint of NMF with a regularization term. In contrast with NMF, which degrades to holistic representations with decreasing amount of data, RNMF is able to extract parts of objects even in the small-sample case. |
Choi, J; Gutierrez-Osuna, R Estimating the principal dynamic modes of autonomic state with wearable sensors Technical Report 2008. @techreport{choi08estimating,
title = {Estimating the principal dynamic modes of autonomic state with wearable sensors},
author = {J Choi and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/choi08estimating.pdf},
year = {2008},
date = {2008-07-16},
abstract = {The relationship between the autonomic nervous system and the heart provides a window into our internal state, e.g., stressed vs. relaxed. This relationship has received extensive attention in cardiovascular physiology, typically with electrocardiogram recordings under laboratory conditions (e.g., pharmacological blockade). This article presents a signal-processing method to estimate autonomic activation using heart-rate monitors under more naturalistic conditions. The method uses non-linear system identification and eigen-analysis to decouple contributions from the two autonomic branches (i.e., sympathetic and parasympathetic). We validate the method using experimental data from a wearable sensor platform that we have designed for experience sampling. Using a discrimination test between two physiological conditions (supine and tilt), we show that our method outperforms traditional techniques based on spectral analysis of heart rate variability.},
keywords = {Wearable sensors},
pubstate = {published},
tppubtype = {techreport}
}
The relationship between the autonomic nervous system and the heart provides a window into our internal state, e.g., stressed vs. relaxed. This relationship has received extensive attention in cardiovascular physiology, typically with electrocardiogram recordings under laboratory conditions (e.g., pharmacological blockade). This article presents a signal-processing method to estimate autonomic activation using heart-rate monitors under more naturalistic conditions. The method uses non-linear system identification and eigen-analysis to decouple contributions from the two autonomic branches (i.e., sympathetic and parasympathetic). We validate the method using experimental data from a wearable sensor platform that we have designed for experience sampling. Using a discrimination test between two physiological conditions (supine and tilt), we show that our method outperforms traditional techniques based on spectral analysis of heart rate variability. |
Felps, D; Bortfeld, H; Gutierrez-Osuna, R Prosodic and segmental factors in foreign-accent conversion Technical Report 2008. @techreport{felps08prosodic,
title = {Prosodic and segmental factors in foreign-accent conversion},
author = {D Felps and H Bortfeld and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/felps08prosodic.pdf},
year = {2008},
date = {2008-07-11},
abstract = {We propose a signal processing method that transforms foreign-accented speech to resemble its native-accented counterpart. The problem is closely related to voice conversion, except that our method seeks to preserve the organic properties of the foreign speaker’s voice; i.e., only those features which cue foreign-accentedness are to be transformed. Our method operates at two levels: prosodic and segmental. Prosodic transformation is performed by means of time and pitch scaling. Segmental transformation is performed by convolving the foreign speaker’s excitation with the warped spectral envelope of the native speaker. Perceptual results indicate that our model is able to provide a 63% reduction in foreign-accentedness. Multidimensional scaling also shows that the segmental transformation causes the perception of a new speaker to emerge, though the identity of this new speaker is three times closer to the foreign speaker than to the native speaker.},
keywords = {Accent conversion, Speech},
pubstate = {published},
tppubtype = {techreport}
}
We propose a signal processing method that transforms foreign-accented speech to resemble its native-accented counterpart. The problem is closely related to voice conversion, except that our method seeks to preserve the organic properties of the foreign speaker’s voice; i.e., only those features which cue foreign-accentedness are to be transformed. Our method operates at two levels: prosodic and segmental. Prosodic transformation is performed by means of time and pitch scaling. Segmental transformation is performed by convolving the foreign speaker’s excitation with the warped spectral envelope of the native speaker. Perceptual results indicate that our model is able to provide a 63% reduction in foreign-accentedness. Multidimensional scaling also shows that the segmental transformation causes the perception of a new speaker to emerge, though the identity of this new speaker is three times closer to the foreign speaker than to the native speaker. |
Choi, H; Gutierrez-Osuna, R; Choi, S; Choe, Y Kernel oriented discriminant analysis for speaker-independent phoneme spaces Conference International Conference on Pattern Recognition, IEEE 2008. @conference{choi2008kernel,
title = {Kernel oriented discriminant analysis for speaker-independent phoneme spaces},
author = {H Choi and R Gutierrez-Osuna and S Choi and Y Choe},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/choi2008kernel.pdf},
year = {2008},
date = {2008-01-01},
booktitle = {International Conference on Pattern Recognition},
pages = {1--4},
organization = {IEEE},
abstract = {Speaker independent feature extraction is a critical problem in speech recognition. Oriented principal component analysis (OPCA) is a potential solution that can find a subspace robust against noise of the data set. The objective of this paper is to find a speaker-independent subspace by generalizing OPCA in two steps: First, we find a nonlinear subspace with the help of a kernel trick, which we refer to as kernel OPCA. Second, we generalize OPCA to problems with more than two phonemes, which leads to oriented discriminant analysis (ODA). In addition, we equip ODA with the kernel trick again, which we refer to as kernel ODA. The models are tested on the CMU ARCTIC speech database. Our results indicate that our proposed kernel methods can outperform linear OPCA and linear ODA at finding a speaker-independent phoneme space.},
keywords = {Speech},
pubstate = {published},
tppubtype = {conference}
}
Speaker independent feature extraction is a critical problem in speech recognition. Oriented principal component analysis (OPCA) is a potential solution that can find a subspace robust against noise of the data set. The objective of this paper is to find a speaker-independent subspace by generalizing OPCA in two steps: First, we find a nonlinear subspace with the help of a kernel trick, which we refer to as kernel OPCA. Second, we generalize OPCA to problems with more than two phonemes, which leads to oriented discriminant analysis (ODA). In addition, we equip ODA with the kernel trick again, which we refer to as kernel ODA. The models are tested on the CMU ARCTIC speech database. Our results indicate that our proposed kernel methods can outperform linear OPCA and linear ODA at finding a speaker-independent phoneme space. |
Rodriguez, J; Bortfeld, H; Gutierrez-Osuna, R Reducing the other-race effect through caricatures Conference IEEE International Conference on Automatic Face & Gesture Recognition, IEEE 2008. @conference{rodriguez2008reducing,
title = {Reducing the other-race effect through caricatures},
author = {J Rodriguez and H Bortfeld and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/rodriguez2008reducing.pdf},
year = {2008},
date = {2008-01-01},
booktitle = {IEEE International Conference on Automatic Face & Gesture Recognition},
pages = {1--5},
organization = {IEEE},
abstract = {We recognize faces from our own race better than those from another race. Although the relative contribution of different mechanisms (e.g. contact vs. attention) remains elusive, it is generally agreed that the other-race effect results from the fact that discriminatory facial features are race-dependent. Previous research has also shown that facial recognition improves when viewers are first familiarized with faces whose most distinctive features have been caricaturized. In this study, we sought to determine the extent to which familiarization with caricaturized faces could also be used to reduce other-race effects. Using an old/new face recognition paradigm, Caucasian subjects were first familiarized with a set of faces from multiple races, and then asked to recognize those faces among a set of confounders. Participants who were familiarized with and then asked to recognize veridical versions of the faces showed a significant other-race effect on Indian faces. In contrast, participants who were familiarized with caricaturized versions of the same faces, and then asked to recognize their veridical versions, showed no other-race effects on Indian faces. This result suggests that caricaturization may be used to help individuals focus their attention to features that are useful for recognition of other-race faces.},
keywords = {Face perception},
pubstate = {published},
tppubtype = {conference}
}
We recognize faces from our own race better than those from another race. Although the relative contribution of different mechanisms (e.g. contact vs. attention) remains elusive, it is generally agreed that the other-race effect results from the fact that discriminatory facial features are race-dependent. Previous research has also shown that facial recognition improves when viewers are first familiarized with faces whose most distinctive features have been caricaturized. In this study, we sought to determine the extent to which familiarization with caricaturized faces could also be used to reduce other-race effects. Using an old/new face recognition paradigm, Caucasian subjects were first familiarized with a set of faces from multiple races, and then asked to recognize those faces among a set of confounders. Participants who were familiarized with and then asked to recognize veridical versions of the faces showed a significant other-race effect on Indian faces. In contrast, participants who were familiarized with caricaturized versions of the same faces, and then asked to recognize their veridical versions, showed no other-race effects on Indian faces. This result suggests that caricaturization may be used to help individuals focus their attention to features that are useful for recognition of other-race faces. |
Paulson, B; Rajan, P; Davalos, P; Gutierrez-Osuna, R; Hammond, T What!?! no Rubine features?: using geometric-based features to produce normalized confidence values for sketch recognition Conference HCC Workshop: Sketch Tools for Diagramming, 2008. @conference{paulson2008no,
title = {What!?! no Rubine features?: using geometric-based features to produce normalized confidence values for sketch recognition},
author = {B Paulson and P Rajan and P Davalos and R Gutierrez-Osuna and T Hammond},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/paulson2008no.pdf},
year = {2008},
date = {2008-01-01},
booktitle = {HCC Workshop: Sketch Tools for Diagramming},
pages = {57--63},
abstract = {As pen-based interfaces become more popular in today’s applications, the need for algorithms to accurately recognize hand-drawn sketches and shapes has increased. In many cases, complex shapes can be constructed hierarchically as a combination of smaller primitive shapes meeting certain geometric constraints.However, in order to construct higher level shapes, it is imperative to accurately recognize the lower-level primitives. Two approaches have become widespread in the sketch recognition field for recognizing lower-level primitives: gesture-based recognition and geometric-based recognition. Our goal is to use a hybrid approach that combines features from both traditional gesture based recognition systems and geometric-based recognition systems. In this paper, we show that we can produce a system with high recognition rates while providing the added benefit of being able to produce normalized confidence values for alternative interpretations;something most geometric-based recognizers lack. Moresignificantly, results from feature subset selection indicate that geometric features aid the recognition process more than gesture-based features when given naturally sketched data.},
keywords = {Gestures},
pubstate = {published},
tppubtype = {conference}
}
As pen-based interfaces become more popular in today’s applications, the need for algorithms to accurately recognize hand-drawn sketches and shapes has increased. In many cases, complex shapes can be constructed hierarchically as a combination of smaller primitive shapes meeting certain geometric constraints.However, in order to construct higher level shapes, it is imperative to accurately recognize the lower-level primitives. Two approaches have become widespread in the sketch recognition field for recognizing lower-level primitives: gesture-based recognition and geometric-based recognition. Our goal is to use a hybrid approach that combines features from both traditional gesture based recognition systems and geometric-based recognition systems. In this paper, we show that we can produce a system with high recognition rates while providing the added benefit of being able to produce normalized confidence values for alternative interpretations;something most geometric-based recognizers lack. Moresignificantly, results from feature subset selection indicate that geometric features aid the recognition process more than gesture-based features when given naturally sketched data. |
Hierlemann, A; Gutierrez-Osuna, R Higher-order chemical sensing Journal Article In: Chemical reviews, vol. 108, no. 2, pp. 563, 2008. @article{hierlemann2008higher,
title = {Higher-order chemical sensing},
author = {A Hierlemann and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/hierlemann2008higher.pdf},
year = {2008},
date = {2008-01-01},
journal = {Chemical reviews},
volume = {108},
number = {2},
pages = {563},
keywords = {Active sensing, Chemical sensors},
pubstate = {published},
tppubtype = {article}
}
|
Yu, N Y; Yamauchi, T; Yang, H F; Chen, Y L; Gutierrez-Osuna, R A Computational Method to Find Salient Features Conference Proceedings of the 6th International Conference of Cognitive Science, 2008. @conference{yu2008Salient,
title = {A Computational Method to Find Salient Features},
author = {N Y Yu and T Yamauchi and H F Yang and Y L Chen and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/yu2008Salient.pdf},
year = {2008},
date = {2008-01-01},
booktitle = {Proceedings of the 6th International Conference of Cognitive Science},
abstract = {Although it is well known that people selectively attend to salient features in similarity judgment, no clear method of identifying “salient features” has been proposed. In this study, we present a new computational technique to identify salient features. First, we collected behavioral data from human participants, and this data was simulated with machine learning techniques, which determined optimal allocations of weights of candidate features. Results revealed image-specific sets of salient features for similarity perception, and suggested that people exaggerate differences between features while computing similarity.},
keywords = {Face perception},
pubstate = {published},
tppubtype = {conference}
}
Although it is well known that people selectively attend to salient features in similarity judgment, no clear method of identifying “salient features” has been proposed. In this study, we present a new computational technique to identify salient features. First, we collected behavioral data from human participants, and this data was simulated with machine learning techniques, which determined optimal allocations of weights of candidate features. Results revealed image-specific sets of salient features for similarity perception, and suggested that people exaggerate differences between features while computing similarity. |
2007
|
Koh, E; Caruso, D; Kerne, A; Gutierrez-Osuna, R Elimination of junk document surrogate candidates through pattern recognition Conference Proceedings of the 2007 ACM symposium on Document engineering, ACM 2007. @conference{koh2007elimination,
title = {Elimination of junk document surrogate candidates through pattern recognition},
author = {E Koh and D Caruso and A Kerne and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/koh2007elimination.pdf},
year = {2007},
date = {2007-01-01},
booktitle = {Proceedings of the 2007 ACM symposium on Document engineering},
pages = {187--195},
organization = {ACM},
abstract = {A surrogate is an object that stands for a document and enables navigation to that document. Hypermedia is often represented with textual surrogates, even though studies have shown that image and text surrogates facilitate the formation of mental models and overall understanding. Surrogates may be formed by breaking a document down into a set of smaller elements, each of which is a surrogate candidate. While processing these surrogate candidates from an HTML document, relevant information may appear together with less useful junk material, such as navigation bars and advertisements.
This paper develops a pattern recognition based approach for eliminating junk while building the set of surrogate candidates. The approach defines features on candidate elements, and uses classification algorithms to make selection decisions based on these features. For the purpose of defining features in surrogate candidates, we introduce the Document Surrogate Model (DSM), a streamlined Document Object Model (DOM)-like representation of semantic structure. Using a quadratic classifier, we were able to eliminate junk surrogate candidates with an average classification rate of 80%. By using this technique, semiautonomous agents can be developed to more effectively generate surrogate collections for users. We end by describing a new approach for hypermedia and the semantic web, which uses the DSM to define value-added surrogates for a document.},
keywords = {Pattern recognition},
pubstate = {published},
tppubtype = {conference}
}
A surrogate is an object that stands for a document and enables navigation to that document. Hypermedia is often represented with textual surrogates, even though studies have shown that image and text surrogates facilitate the formation of mental models and overall understanding. Surrogates may be formed by breaking a document down into a set of smaller elements, each of which is a surrogate candidate. While processing these surrogate candidates from an HTML document, relevant information may appear together with less useful junk material, such as navigation bars and advertisements.
This paper develops a pattern recognition based approach for eliminating junk while building the set of surrogate candidates. The approach defines features on candidate elements, and uses classification algorithms to make selection decisions based on these features. For the purpose of defining features in surrogate candidates, we introduce the Document Surrogate Model (DSM), a streamlined Document Object Model (DOM)-like representation of semantic structure. Using a quadratic classifier, we were able to eliminate junk surrogate candidates with an average classification rate of 80%. By using this technique, semiautonomous agents can be developed to more effectively generate surrogate collections for users. We end by describing a new approach for hypermedia and the semantic web, which uses the DSM to define value-added surrogates for a document. |
Nogueira, F G; Felps, D; Gutierrez-Osuna, R Development of an infrared absorption spectroscope based on linear variable filters Journal Article In: Sensors Journal, IEEE, vol. 7, no. 8, pp. 1183–1190, 2007. @article{nogueira2007development,
title = {Development of an infrared absorption spectroscope based on linear variable filters},
author = {F G Nogueira and D Felps and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/nogueira2007development.pdf},
year = {2007},
date = {2007-01-01},
journal = {Sensors Journal, IEEE},
volume = {7},
number = {8},
pages = {1183--1190},
publisher = {IEEE},
abstract = {The objective of this research is to develop a low-cost infrared absorption spectroscope based on linear variable filter technology for the automated detection of concentrated gases and vapors, and the semiautomated detection of liquids. This instrument represents an alternative to electronic-nose devices based on cross-selective gas sensor arrays. Instead, the proposed instrument uses the concept of computational ldquopseudosensors,rdquo whereby spectral lines in an analytical instrument are clustered into groups and used as independent variables. We characterize the system on a database of chemical mixtures, and evaluate it on two real-world applications in the foodstuffs domain: oil adulteration and trans-fatty acid detection. Our results show that the proposed system is a viable low-resolution, low-cost analytical technique for niche applications.},
keywords = {Infrared spectroscopy},
pubstate = {published},
tppubtype = {article}
}
The objective of this research is to develop a low-cost infrared absorption spectroscope based on linear variable filter technology for the automated detection of concentrated gases and vapors, and the semiautomated detection of liquids. This instrument represents an alternative to electronic-nose devices based on cross-selective gas sensor arrays. Instead, the proposed instrument uses the concept of computational ldquopseudosensors,rdquo whereby spectral lines in an analytical instrument are clustered into groups and used as independent variables. We characterize the system on a database of chemical mixtures, and evaluate it on two real-world applications in the foodstuffs domain: oil adulteration and trans-fatty acid detection. Our results show that the proposed system is a viable low-resolution, low-cost analytical technique for niche applications. |
Raman, B; Kotseroglou, T; Clark, L; Lebl, M; Gutierrez-Osuna, R Neuromorphic processing for optical microbead arrays: dimensionality reduction and contrast enhancement Journal Article In: Sensors Journal, IEEE, vol. 7, no. 4, pp. 506–514, 2007. @article{raman2007neuromorphic,
title = {Neuromorphic processing for optical microbead arrays: dimensionality reduction and contrast enhancement},
author = {B Raman and T Kotseroglou and L Clark and M Lebl and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/raman2007neuromorphic.pdf},
year = {2007},
date = {2007-01-01},
journal = {Sensors Journal, IEEE},
volume = {7},
number = {4},
pages = {506--514},
publisher = {IEEE},
abstract = {This paper presents a neuromorphic approach for sensor-based machine olfaction that combines a portable chemical detection system based on microbead array technology with a biologically inspired model of signal processing in the olfactory bulb. The sensor array contains hundreds of microbeads coated with solvatochromic dyes adsorbed in, or covalently attached on, the matrix of various microspheres. When exposed to odors, each bead sensor responds with corresponding intensity changes, spectral shifts, and time-dependent variations associated with the fluorescent sensors. The bead array responses are subsequently processed using a model of olfactory circuits that capture the following two functions: chemotopic convergence of receptor neurons and center on-off surround lateral interactions. The first circuit performs dimensionality reduction, transforming the high-dimensional microbead array response into an organized spatial pattern (i.e., an odor image). The second circuit enhances the contrast of these spatial patterns, improving the separability of odors. The model is validated on an experimental dataset containing the responses of a large array of microbead sensors to five different analytes. Our results indicate that the model is able to significantly improve the separability between odor patterns, compared to that available from the raw sensor response.},
keywords = {Chemical sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {article}
}
This paper presents a neuromorphic approach for sensor-based machine olfaction that combines a portable chemical detection system based on microbead array technology with a biologically inspired model of signal processing in the olfactory bulb. The sensor array contains hundreds of microbeads coated with solvatochromic dyes adsorbed in, or covalently attached on, the matrix of various microspheres. When exposed to odors, each bead sensor responds with corresponding intensity changes, spectral shifts, and time-dependent variations associated with the fluorescent sensors. The bead array responses are subsequently processed using a model of olfactory circuits that capture the following two functions: chemotopic convergence of receptor neurons and center on-off surround lateral interactions. The first circuit performs dimensionality reduction, transforming the high-dimensional microbead array response into an organized spatial pattern (i.e., an odor image). The second circuit enhances the contrast of these spatial patterns, improving the separability of odors. The model is validated on an experimental dataset containing the responses of a large array of microbead sensors to five different analytes. Our results indicate that the model is able to significantly improve the separability between odor patterns, compared to that available from the raw sensor response. |
2006
|
Raman, B; Yamanaka, T; Gutierrez-Osuna, R Contrast enhancement of gas sensor array patterns with a neurodynamics model of the olfactory bulb Journal Article In: Sensors and Actuators B: Chemical, vol. 119, no. 2, pp. 547–555, 2006. @article{raman2006contrast,
title = {Contrast enhancement of gas sensor array patterns with a neurodynamics model of the olfactory bulb},
author = {B Raman and T Yamanaka and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/raman2006contrast.pdf},
year = {2006},
date = {2006-01-01},
journal = {Sensors and Actuators B: Chemical},
volume = {119},
number = {2},
pages = {547--555},
publisher = {Elsevier},
abstract = {We propose a biologically inspired signal processing model capable of enhancing the discrimination of multivariate patterns from gassensorarrays. The model captures two functions in the early olfactorypathway: chemotopic convergence of sensory neurons onto the olfactorybulb, and center on–off surround lateral interactions. Sensor features are first topologically projected onto a two-dimensional lattice according to their selectivity profile, leading to odor-specific spatial patterning. The resulting patterns serve as inputs to a network of mitral cells with center on–off surround lateral inhibition, which enhances the initialcontrast among odors and decouples odor identity from intensity. The model is validated using experimental data from an array of temperature-modulated metal-oxide sensors. Our results indicate that the model is able to improve the separability between odor patterns that is available at the inputs.},
keywords = {Chemical sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {article}
}
We propose a biologically inspired signal processing model capable of enhancing the discrimination of multivariate patterns from gassensorarrays. The model captures two functions in the early olfactorypathway: chemotopic convergence of sensory neurons onto the olfactorybulb, and center on–off surround lateral interactions. Sensor features are first topologically projected onto a two-dimensional lattice according to their selectivity profile, leading to odor-specific spatial patterning. The resulting patterns serve as inputs to a network of mitral cells with center on–off surround lateral inhibition, which enhances the initialcontrast among odors and decouples odor identity from intensity. The model is validated using experimental data from an array of temperature-modulated metal-oxide sensors. Our results indicate that the model is able to improve the separability between odor patterns that is available at the inputs. |
Gutierrez-Galvez, A; Gutierrez-Osuna, R Contrast enhancement and background suppression of chemosensor array patterns with the KIII model Journal Article In: International journal of intelligent systems, vol. 21, no. 9, pp. 937–953, 2006. @article{gutierrez2006contrast,
title = {Contrast enhancement and background suppression of chemosensor array patterns with the KIII model},
author = {A Gutierrez-Galvez and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2006contrast.pdf},
year = {2006},
date = {2006-01-01},
journal = {International journal of intelligent systems},
volume = {21},
number = {9},
pages = {937--953},
publisher = {Wiley Online Library},
abstract = {Inspired by the ability of the olfactory bulb to enhance the contrast between odor representations, we propose a new hebbian learning rule that is able to increase the separability of odor patterns from gas sensor arrays. The proposed learning rule employs a hebbian term to build associations within odors and an anti-hebbian term to reduce correlated activity across odors. In addition to increasing the separability of patterns, the new learning rule can also achieve odor background suppression when combined with a habituation term. These two functions are demonstrated on Freeman's KIII, a neurodynamics model of the olfactory system. The system is first characterized on synthetic data, and also validated on experimental data from an array of chemical sensors exposed to organic solvents.},
keywords = {Chemical sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {article}
}
Inspired by the ability of the olfactory bulb to enhance the contrast between odor representations, we propose a new hebbian learning rule that is able to increase the separability of odor patterns from gas sensor arrays. The proposed learning rule employs a hebbian term to build associations within odors and an anti-hebbian term to reduce correlated activity across odors. In addition to increasing the separability of patterns, the new learning rule can also achieve odor background suppression when combined with a habituation term. These two functions are demonstrated on Freeman's KIII, a neurodynamics model of the olfactory system. The system is first characterized on synthetic data, and also validated on experimental data from an array of chemical sensors exposed to organic solvents. |
Gutierrez-Galvez, A; Gutierrez-Osuna, R Increasing the separability of chemosensor array patterns with Hebbian/anti-Hebbian learning Journal Article In: Sensors and Actuators B: Chemical, vol. 116, no. 1, pp. 29–35, 2006. @article{gutierrez2006increasing,
title = {Increasing the separability of chemosensor array patterns with Hebbian/anti-Hebbian learning},
author = {A Gutierrez-Galvez and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2006increasing.pdf},
year = {2006},
date = {2006-01-01},
journal = {Sensors and Actuators B: Chemical},
volume = {116},
number = {1},
pages = {29--35},
publisher = {Elsevier},
abstract = {The olfactory bulb is able to enhance the contrast between odor representations through a combination of excitatory and inhibitory circuits. Inspired by this mechanism, we propose a newHebbian/anti-Hebbianlearning rule to increase the separability of sensor-arraypatterns in a neurodynamics model of the olfactory system: the KIII. In the proposed learning rule, a Hebbian term is used to build associations within odors and an anti-Hebbian term is used to reduce correlated activity across odors. The KIII model with the new learning rule is characterized on synthetic data and validated on experimental data from an array of temperature-modulated metal-oxide sensors. Our results show that the performance of the model is comparable to that obtained with Linear Discriminant Analysis (LDA). Furthermore, the model is able to increase patternseparability for different concentrations of three odorants: allyl-alcohol, tert-butanol, and benzene, even though it is only trained with the gas sensor response to the highest concentration.},
keywords = {Chemical sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {article}
}
The olfactory bulb is able to enhance the contrast between odor representations through a combination of excitatory and inhibitory circuits. Inspired by this mechanism, we propose a newHebbian/anti-Hebbianlearning rule to increase the separability of sensor-arraypatterns in a neurodynamics model of the olfactory system: the KIII. In the proposed learning rule, a Hebbian term is used to build associations within odors and an anti-Hebbian term is used to reduce correlated activity across odors. The KIII model with the new learning rule is characterized on synthetic data and validated on experimental data from an array of temperature-modulated metal-oxide sensors. Our results show that the performance of the model is comparable to that obtained with Linear Discriminant Analysis (LDA). Furthermore, the model is able to increase patternseparability for different concentrations of three odorants: allyl-alcohol, tert-butanol, and benzene, even though it is only trained with the gas sensor response to the highest concentration. |
Raman, B; Gutierrez-Osuna, R Concentration normalization with a model of gain control in the olfactory bulb Journal Article In: Sensors and Actuators B: Chemical, vol. 116, no. 1, pp. 36–42, 2006. @article{raman2006concentration,
title = {Concentration normalization with a model of gain control in the olfactory bulb},
author = {B Raman and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/raman2006concentration.pdf},
year = {2006},
date = {2006-01-01},
journal = {Sensors and Actuators B: Chemical},
volume = {116},
number = {1},
pages = {36--42},
publisher = {Elsevier},
abstract = {This article presents a biologically inspired model capable of removing concentration effects from the multivariate response of a gas sensor array. The model is based on the first stage of lateral inhibition in theolfactorybulb, which is mediated by periglomerular interneurons. To simulate inputs to the olfactorybulb, signals from a chemosensor array are first processed with a self-organizing model of chemotopic convergence proposed earlier, which leads to odor-specific spatial patterning. Subsequently, a shunting lateral inhibitory network, modeled after the role of periglomerular cells in the olfactorybulb, is used to compress concentration information. The model is validated using experimental data from an array of temperature-modulated metal-oxide chemoresistors.},
keywords = {Chemical sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {article}
}
This article presents a biologically inspired model capable of removing concentration effects from the multivariate response of a gas sensor array. The model is based on the first stage of lateral inhibition in theolfactorybulb, which is mediated by periglomerular interneurons. To simulate inputs to the olfactorybulb, signals from a chemosensor array are first processed with a self-organizing model of chemotopic convergence proposed earlier, which leads to odor-specific spatial patterning. Subsequently, a shunting lateral inhibitory network, modeled after the role of periglomerular cells in the olfactorybulb, is used to compress concentration information. The model is validated using experimental data from an array of temperature-modulated metal-oxide chemoresistors. |
Perera-Lluna, A; Yamanaka, T; Gutierrez-Galvez, A; Raman, B; Gutierrez-Osuna, R A dimensionality-reduction technique inspired by receptor convergence in the olfactory system Journal Article In: Sensors and Actuators B: Chemical, vol. 116, no. 1, pp. 17–22, 2006. @article{perera2006dimensionality,
title = {A dimensionality-reduction technique inspired by receptor convergence in the olfactory system},
author = {A Perera-Lluna and T Yamanaka and A Gutierrez-Galvez and B Raman and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/perera2006dimensionality.pdf},
year = {2006},
date = {2006-01-01},
journal = {Sensors and Actuators B: Chemical},
volume = {116},
number = {1},
pages = {17--22},
publisher = {Elsevier},
abstract = {In this paper, we propose a new technique for feature extraction/selection based on the projection of sensor features in class space while taking into account the sensor variance. The proposed technique is inspired by the organization of the early stages in the biological olfactory system. The algorithm proves to be highly suitable for high-dimensional feature vectors. The performance shows robustness with problems where only a small number of samples are available as a training dataset. We demonstrate the method on experimental data from two metal oxide sensors driven by a sinusoidal temperature profile.},
keywords = {Neuromorphic models},
pubstate = {published},
tppubtype = {article}
}
In this paper, we propose a new technique for feature extraction/selection based on the projection of sensor features in class space while taking into account the sensor variance. The proposed technique is inspired by the organization of the early stages in the biological olfactory system. The algorithm proves to be highly suitable for high-dimensional feature vectors. The performance shows robustness with problems where only a small number of samples are available as a training dataset. We demonstrate the method on experimental data from two metal oxide sensors driven by a sinusoidal temperature profile. |
Raman, B; Sun, P A; Gutierrez-Galvez, A; Gutierrez-Osuna, R Processing of chemical sensor arrays with a biologically inspired model of olfactory coding Journal Article In: Neural Networks, IEEE Transactions on, vol. 17, no. 4, pp. 1015–1024, 2006. @article{raman2006processing,
title = {Processing of chemical sensor arrays with a biologically inspired model of olfactory coding},
author = {B Raman and P A Sun and A Gutierrez-Galvez and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/raman2006processing.pdf},
year = {2006},
date = {2006-01-01},
journal = {Neural Networks, IEEE Transactions on},
volume = {17},
number = {4},
pages = {1015--1024},
publisher = {IEEE},
abstract = {This paper presents a computational model for chemical sensor arrays inspired by the first two stages in the olfactory pathway: distributed coding with olfactory receptor neurons and chemotopic convergence onto glomerular units. We propose a monotonic concentration-response model that maps conventional sensor-array inputs into a distributed activation pattern across a large population of neuroreceptors. Projection onto glomerular units in the olfactory bulb is then simulated with a self-organizing model of chemotopic convergence. The pattern recognition performance of the model is characterized using a database of odor patterns from an array of temperature modulated chemical sensors. The chemotopic code achieved by the proposed model is shown to improve the signal-to-noise ratio available at the sensor inputs while being consistent with results from neurobiology.},
keywords = {Chemical sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {article}
}
This paper presents a computational model for chemical sensor arrays inspired by the first two stages in the olfactory pathway: distributed coding with olfactory receptor neurons and chemotopic convergence onto glomerular units. We propose a monotonic concentration-response model that maps conventional sensor-array inputs into a distributed activation pattern across a large population of neuroreceptors. Projection onto glomerular units in the olfactory bulb is then simulated with a self-organizing model of chemotopic convergence. The pattern recognition performance of the model is characterized using a database of odor patterns from an array of temperature modulated chemical sensors. The chemotopic code achieved by the proposed model is shown to improve the signal-to-noise ratio available at the sensor inputs while being consistent with results from neurobiology. |
Kakumanu, P; Esposito, A; Garcia, O N; Gutierrez-Osuna, R A comparison of acoustic coding models for speech-driven facial animation Journal Article In: Speech communication, vol. 48, no. 6, pp. 598–615, 2006. @article{kakumanu2006comparison,
title = {A comparison of acoustic coding models for speech-driven facial animation},
author = {P Kakumanu and A Esposito and O N Garcia and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/kakumanu2006comparison.pdf},
year = {2006},
date = {2006-01-01},
journal = {Speech communication},
volume = {48},
number = {6},
pages = {598--615},
publisher = {Elsevier},
abstract = {This article presents a thorough experimental comparison of several acoustic modeling techniques by their ability to capture information related to orofacial motion. These models include (1) Linear Predictive Coding and Linear Spectral Frequencies, which model the dynamics of the speech production system, (2) Mel Frequency Cepstral Coefficients and Perceptual Critical Feature Bands, which encode perceptual cues of speech, (3) spectral energy and fundamental frequency, which capture prosodic aspects, and (4) two hybrid methods that combine information from the previous models. We also consider a novel supervised procedure based on Fisher’s Linear Discriminants to project acoustic information onto a low-dimensional subspace that best discriminates different orofacial configurations. Prediction of orofacial motion from speech acoustics is performed using a non-parametric k-nearest-neighbors procedure. The sensitivity of this audio–visual mapping to coarticulation effects and spatial locality is thoroughly investigated. Our results indicate that the hybrid use of articulatory, perceptual and prosodic features of speech, combined with a supervised dimensionality-reduction procedure, is able to outperform any individual acoustic model for speech-driven facial animation. These results are validated on the 450 sentences of the TIMIT compact dataset.},
keywords = {Facial animation},
pubstate = {published},
tppubtype = {article}
}
This article presents a thorough experimental comparison of several acoustic modeling techniques by their ability to capture information related to orofacial motion. These models include (1) Linear Predictive Coding and Linear Spectral Frequencies, which model the dynamics of the speech production system, (2) Mel Frequency Cepstral Coefficients and Perceptual Critical Feature Bands, which encode perceptual cues of speech, (3) spectral energy and fundamental frequency, which capture prosodic aspects, and (4) two hybrid methods that combine information from the previous models. We also consider a novel supervised procedure based on Fisher’s Linear Discriminants to project acoustic information onto a low-dimensional subspace that best discriminates different orofacial configurations. Prediction of orofacial motion from speech acoustics is performed using a non-parametric k-nearest-neighbors procedure. The sensitivity of this audio–visual mapping to coarticulation effects and spatial locality is thoroughly investigated. Our results indicate that the hybrid use of articulatory, perceptual and prosodic features of speech, combined with a supervised dimensionality-reduction procedure, is able to outperform any individual acoustic model for speech-driven facial animation. These results are validated on the 450 sentences of the TIMIT compact dataset. |
2005
|
Raman, B; Gutierrez-Osuna, R Concentration normalization with a model of gain control in the olfactory bulb Journal Article In: Sensors and Actuators B: Chemical, vol. 116, no. 1, pp. 36-42, 2005. @article{raman2005sensors,
title = {Concentration normalization with a model of gain control in the olfactory bulb},
author = {B Raman and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/raman2005sensors.pdf},
year = {2005},
date = {2005-04-13},
booktitle = {Proceedings of the 11th International Symposium on Olfaction and Electronic Nose},
journal = {Sensors and Actuators B: Chemical},
volume = {116},
number = {1},
pages = {36-42},
abstract = {This article presents a biologically-inspired model to remove concentration effects from the multivariate response of a gas sensor array. The model is based on the first stage of lateral inhibition in the olfactory bulb, mediated by periglomerular interneurons. To simulate inputs to the olfactory bulb, sensor-array data are processed with a self-organizing model of chemotopic convergence proposed earlier, which leads to odorspecific spatial patterning. Subsequently, a shunting lateral inhibitory network, modeled after the role of periglomerular cells, compresses the concentration information. The model is validated using experimental data from an array of temperature-modulated metaloxide sensors.},
keywords = {Chemical sensors, Neuromorphic models, Temperature modulation},
pubstate = {published},
tppubtype = {article}
}
This article presents a biologically-inspired model to remove concentration effects from the multivariate response of a gas sensor array. The model is based on the first stage of lateral inhibition in the olfactory bulb, mediated by periglomerular interneurons. To simulate inputs to the olfactory bulb, sensor-array data are processed with a self-organizing model of chemotopic convergence proposed earlier, which leads to odorspecific spatial patterning. Subsequently, a shunting lateral inhibitory network, modeled after the role of periglomerular cells, compresses the concentration information. The model is validated using experimental data from an array of temperature-modulated metaloxide sensors. |
Yu, Y; Gutierrez-Osuna, R; Choe, Y Preserving Class Discriminatory Information by Context-Sensitve Intra-Class Clustering Algorithm Technical Report 2005. @techreport{yu2005techreport,
title = {Preserving Class Discriminatory Information by Context-Sensitve Intra-Class Clustering Algorithm},
author = {Y Yu and R Gutierrez-Osuna and Y Choe},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/yu05techreport.pdf},
year = {2005},
date = {2005-02-25},
abstract = {Many powerful techniques in supervised learning (e.g. linear discriminant analysis, LDA, and quadratic classifier) assume that data in each class have a single Gaussian distribution. In reality, data in the class of interest, i.e., the object class, could have non-Gaussian distributions and could be isolated into several subgroups by the data from other classes (the context classes). To address this problem, one possible way is to partition one class into several subclasses. This intra-class clustering should depend on the data structure of the class of interest (object class) as well as the distributions of all other classes (context classes). In this paper, we presented a novel method of intra-class clustering which can divide a non-Gaussian class data into several Gaussian-like clusters, and at the same time this algorithm is context sensitive, which can maximally reduce the overlapping among resulting classes and also between the object class and the context classes. The method can serve as a general data preprocessing method to improve performance of supervised learning algorithms such as LDA and quadratic classifiers.},
keywords = {Pattern recognition},
pubstate = {published},
tppubtype = {techreport}
}
Many powerful techniques in supervised learning (e.g. linear discriminant analysis, LDA, and quadratic classifier) assume that data in each class have a single Gaussian distribution. In reality, data in the class of interest, i.e., the object class, could have non-Gaussian distributions and could be isolated into several subgroups by the data from other classes (the context classes). To address this problem, one possible way is to partition one class into several subclasses. This intra-class clustering should depend on the data structure of the class of interest (object class) as well as the distributions of all other classes (context classes). In this paper, we presented a novel method of intra-class clustering which can divide a non-Gaussian class data into several Gaussian-like clusters, and at the same time this algorithm is context sensitive, which can maximally reduce the overlapping among resulting classes and also between the object class and the context classes. The method can serve as a general data preprocessing method to improve performance of supervised learning algorithms such as LDA and quadratic classifiers. |
Raman, B; Gutierrez-Osuna, R Mixture segmentation and background suppression in chemosensor arrays with a model of olfactory bulb-cortex interaction Conference Proceedings of IEEE International Joint Conference on Neural Networks, IEEE 2005. @conference{raman2005ijcnn,
title = {Mixture segmentation and background suppression in chemosensor arrays with a model of olfactory bulb-cortex interaction},
author = {B Raman and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/raman2005ijcnn.pdf},
year = {2005},
date = {2005-01-01},
booktitle = {Proceedings of IEEE International Joint Conference on Neural Networks},
pages = {131--136},
organization = {IEEE},
abstract = {We present a model of olfactory bulb-cortex interaction for the purpose of mixture processing with gas sensor arrays. The olfactory bulb is modeled with a neurodynamic model whose lateral inhibitory connections are learned through a modified Hebbian-anti-Hebbian rule. Bulbar outputs are then projected in a non-topographic fashion onto the olfactory cortex. Associational connections within cortex using Hebbian learning form a content addressable memory. Finally, inhibitory feedback from cortex is used to modulate bulbar activity. Depending on the form of feedback, Hebbian or anti-Hebbian, the model is able to perform background suppression or mixture segmentation. The model is validated on experimental data from a gas sensor array.},
keywords = {Chemical sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {conference}
}
We present a model of olfactory bulb-cortex interaction for the purpose of mixture processing with gas sensor arrays. The olfactory bulb is modeled with a neurodynamic model whose lateral inhibitory connections are learned through a modified Hebbian-anti-Hebbian rule. Bulbar outputs are then projected in a non-topographic fashion onto the olfactory cortex. Associational connections within cortex using Hebbian learning form a content addressable memory. Finally, inhibitory feedback from cortex is used to modulate bulbar activity. Depending on the form of feedback, Hebbian or anti-Hebbian, the model is able to perform background suppression or mixture segmentation. The model is validated on experimental data from a gas sensor array. |
Gutierrez-Galvez, A; Gutierrez-Osuna, R Contrast enhancement of sensor-array patterns through hebbian/antihebbian learning Conference Proceedings of the 11th International Symposium on Olfaction and Electronic Nose, 2005. @conference{gutierrez2005contrast,
title = {Contrast enhancement of sensor-array patterns through hebbian/antihebbian learning},
author = {A Gutierrez-Galvez and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2005isoen.pdf},
year = {2005},
date = {2005-01-01},
booktitle = {Proceedings of the 11th International Symposium on Olfaction and Electronic Nose},
abstract = {The olfactory bulb is able to enhance the contrast between odor representations through a combination of excitatory and inhibitory circuits. Inspired by this mechanism, we propose a new Hebbian/anti-Hebbian learning rule to increase the contrast of sensor-array patterns in a neurodynamics model of the olfactory system: the KIII. In the proposed learning rule, a Hebbian term is used to build associations within odors and an anti-Hebbian term is used to reduce correlated activity across odors. The system is characterized on synthetic data showing its ability to increase the separation between patterns and its robustness against noise. Experimental data from an array of temperature-modulated metal-oxide sensors is used to validate the contrast enhancement ability of the system.},
keywords = {Chemical sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {conference}
}
The olfactory bulb is able to enhance the contrast between odor representations through a combination of excitatory and inhibitory circuits. Inspired by this mechanism, we propose a new Hebbian/anti-Hebbian learning rule to increase the contrast of sensor-array patterns in a neurodynamics model of the olfactory system: the KIII. In the proposed learning rule, a Hebbian term is used to build associations within odors and an anti-Hebbian term is used to reduce correlated activity across odors. The system is characterized on synthetic data showing its ability to increase the separation between patterns and its robustness against noise. Experimental data from an array of temperature-modulated metal-oxide sensors is used to validate the contrast enhancement ability of the system. |
Fu, S; Gutierrez-Osuna, R; Esposito, A; Kakumanu, P; Garcia, O N Audio/visual mapping with cross-modal hidden Markov models Journal Article In: Multimedia, IEEE Transactions on, vol. 7, no. 2, pp. 243–252, 2005. @article{fu2005tmm,
title = {Audio/visual mapping with cross-modal hidden Markov models},
author = {S Fu and R Gutierrez-Osuna and A Esposito and P Kakumanu and O N Garcia},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/fu2005tmm.pdf},
year = {2005},
date = {2005-01-01},
journal = {Multimedia, IEEE Transactions on},
volume = {7},
number = {2},
pages = {243--252},
publisher = {IEEE},
abstract = {The audio/visual mapping problem of speech-driven facial animation has intrigued researchers for years. Recent research efforts have demonstrated that hidden Markov model (HMM) techniques, which have been applied successfully to the problem of speech recognition, could achieve a similar level of success in audio/visual mapping problems. A number of HMM-based methods have been proposed and shown to be effective by the respective designers, but it is yet unclear how these techniques compare to each other on a common test bed. In this paper, we quantitatively compare three recently proposed cross-modal HMM methods, namely the remapping HMM (R-HMM), the least-mean-squared HMM (LMS-HMM), and HMM inversion (HMMI). The objective of our comparison is not only to highlight the merits and demerits of different mapping designs, but also to study the optimality of the acoustic representation and HMM structure for the purpose of speech-driven facial animation. This paper presents a brief overview of these models, followed by an analysis of their mapping capabilities on a synthetic dataset. An empirical comparison on an experimental audio-visual dataset consisting of 75 TIMIT sentences is finally presented. Our results show that HMMI provides the best performance, both on synthetic and experimental audio-visual data.},
keywords = {Facial animation},
pubstate = {published},
tppubtype = {article}
}
The audio/visual mapping problem of speech-driven facial animation has intrigued researchers for years. Recent research efforts have demonstrated that hidden Markov model (HMM) techniques, which have been applied successfully to the problem of speech recognition, could achieve a similar level of success in audio/visual mapping problems. A number of HMM-based methods have been proposed and shown to be effective by the respective designers, but it is yet unclear how these techniques compare to each other on a common test bed. In this paper, we quantitatively compare three recently proposed cross-modal HMM methods, namely the remapping HMM (R-HMM), the least-mean-squared HMM (LMS-HMM), and HMM inversion (HMMI). The objective of our comparison is not only to highlight the merits and demerits of different mapping designs, but also to study the optimality of the acoustic representation and HMM structure for the purpose of speech-driven facial animation. This paper presents a brief overview of these models, followed by an analysis of their mapping capabilities on a synthetic dataset. An empirical comparison on an experimental audio-visual dataset consisting of 75 TIMIT sentences is finally presented. Our results show that HMMI provides the best performance, both on synthetic and experimental audio-visual data. |
Gutierrez-Osuna, R; Kakumanu, P; Esposito, A; Garcia, ON; Bojorquez, A; Castillo, JL; Rudomin, I Speech-driven facial animation with realistic dynamics Journal Article In: Multimedia, IEEE Transactions on, vol. 7, no. 1, pp. 33–42, 2005. @article{gutierrez2005tmm,
title = {Speech-driven facial animation with realistic dynamics},
author = {R Gutierrez-Osuna and P Kakumanu and A Esposito and ON Garcia and A Bojorquez and JL Castillo and I Rudomin},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2005tmm.pdf},
year = {2005},
date = {2005-01-01},
journal = {Multimedia, IEEE Transactions on},
volume = {7},
number = {1},
pages = {33--42},
publisher = {IEEE},
abstract = {This work presents an integral system capable of generating animations with realistic dynamics, including the individualized nuances, of three-dimensional (3-D) human faces driven by speech acoustics. The system is capable of capturing short phenomena in the orofacial dynamics of a given speaker by tracking the 3-D location of various MPEG-4 facial points through stereovision. A perceptual transformation of the speech spectral envelope and prosodic cues are combined into an acoustic feature vector to predict 3-D orofacial dynamics by means of a nearest-neighbor algorithm. The Karhunen-Loe´ve transformation is used to identify the principal components of orofacial motion, decoupling perceptually natural components from experimental noise. We also present a highly optimized MPEG-4 compliant player capable of generating audio-synchronized animations at 60 frames/s. The player is based on a pseudo-muscle model augmented with a nonpenetrable ellipsoidal structure to approximate the skull and the jaw. This structure adds a sense of volume that provides more realistic dynamics than existing simplified pseudo-muscle-based approaches, yet it is simple enough to work at the desired frame rate. Experimental results on an audiovisual database of compact TIMIT sentences are presented to illustrate the performance of the complete system.},
keywords = {Facial animation, Speech},
pubstate = {published},
tppubtype = {article}
}
This work presents an integral system capable of generating animations with realistic dynamics, including the individualized nuances, of three-dimensional (3-D) human faces driven by speech acoustics. The system is capable of capturing short phenomena in the orofacial dynamics of a given speaker by tracking the 3-D location of various MPEG-4 facial points through stereovision. A perceptual transformation of the speech spectral envelope and prosodic cues are combined into an acoustic feature vector to predict 3-D orofacial dynamics by means of a nearest-neighbor algorithm. The Karhunen-Loe&acute;ve transformation is used to identify the principal components of orofacial motion, decoupling perceptually natural components from experimental noise. We also present a highly optimized MPEG-4 compliant player capable of generating audio-synchronized animations at 60 frames/s. The player is based on a pseudo-muscle model augmented with a nonpenetrable ellipsoidal structure to approximate the skull and the jaw. This structure adds a sense of volume that provides more realistic dynamics than existing simplified pseudo-muscle-based approaches, yet it is simple enough to work at the desired frame rate. Experimental results on an audiovisual database of compact TIMIT sentences are presented to illustrate the performance of the complete system. |
Perera-Lluna, A; Yamanaka, T; Gutierrez-Gálvez, A; Raman, B; Gutierrez-Osuna, R A dimensionality-reduction technique inspired by receptor convergence in the olfactory system Conference Proceedings of the 11th International Symposium on Olfaction and Electronic Nose, 2005. @conference{perera2005isoen,
title = {A dimensionality-reduction technique inspired by receptor convergence in the olfactory system},
author = {A Perera-Lluna and T Yamanaka and A Gutierrez-Gálvez and B Raman and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/perera2005isoen.pdf},
year = {2005},
date = {2005-01-01},
booktitle = {Proceedings of the 11th International Symposium on Olfaction and Electronic Nose},
abstract = {In this paper we propose a new technique for feature extraction/selection based on the projection of sensor features in class space and taking into account the sensor variance. The proposed technique is inspired by the organization of the early stages in the biological olfactory system, and proves to be highly suitable for high-dimensional feature vectors with small number of training samples. We demonstrate the method on experimental data from two metal oxide sensors driven by a sinusoidal temperature profile.},
keywords = {Neuromorphic models},
pubstate = {published},
tppubtype = {conference}
}
In this paper we propose a new technique for feature extraction/selection based on the projection of sensor features in class space and taking into account the sensor variance. The proposed technique is inspired by the organization of the early stages in the biological olfactory system, and proves to be highly suitable for high-dimensional feature vectors with small number of training samples. We demonstrate the method on experimental data from two metal oxide sensors driven by a sinusoidal temperature profile. |
2004
|
Gutierrez-Galvez, A; Gutierrez-Osuna, R; Raman, B Pattern recognition for chemosensor arrays with the KIII model Conference Proceedings of the 2004 Symposium on Intentional Dynamic Systems, 2004. @conference{gutierrez2004pattern,
title = {Pattern recognition for chemosensor arrays with the KIII model},
author = {A Gutierrez-Galvez and R Gutierrez-Osuna and B Raman},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2004pattern.pdf},
year = {2004},
date = {2004-04-24},
booktitle = {Proceedings of the 2004 Symposium on Intentional Dynamic Systems},
journal = {Proc. 2004 Symposium on Intentional Dynamic Systems},
pages = {24--26},
keywords = {Chemical sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {conference}
}
|
Gutierrez-Osuna, R; Raman, B Cancellation of chemical backgrounds with generalized Fisher's linear discriminants Conference Proceedings of IEEE Sensors, IEEE 2004. @conference{gutierrez2004cancellation,
title = {Cancellation of chemical backgrounds with generalized Fisher's linear discriminants},
author = {R Gutierrez-Osuna and B Raman},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2004cancellation.pdf},
year = {2004},
date = {2004-01-01},
booktitle = {Proceedings of IEEE Sensors},
pages = {1381--1384},
organization = {IEEE},
abstract = {This article presents a signal-processing technique capable of canceling the effect of background chemicals from the multivariate response of a sensor array. We propose a generalization of the Fishers eigenvalue solution that minimizes the discrimination between undesirable chemicals and a neutral reference. The proposed technique is a generalization of an earlier model that was limited to the removal of single volatiles. A reformulation of class memberships allows the new model to cancel the effect of both single and mixture backgrounds. The model is validated on experimental data from an array of temperature-modulated metal-oxide sensors exposed to binary and ternary mixtures.},
keywords = {Chemical sensors},
pubstate = {published},
tppubtype = {conference}
}
This article presents a signal-processing technique capable of canceling the effect of background chemicals from the multivariate response of a sensor array. We propose a generalization of the Fishers eigenvalue solution that minimizes the discrimination between undesirable chemicals and a neutral reference. The proposed technique is a generalization of an earlier model that was limited to the removal of single volatiles. A reformulation of class memberships allows the new model to cancel the effect of both single and mixture backgrounds. The model is validated on experimental data from an array of temperature-modulated metal-oxide sensors exposed to binary and ternary mixtures. |
Wang, M; Perera-Lluna, A; Gutierrez-Osuna, R Principal Discriminants Analysis for small-sample-size problems: application to chemical sensing Conference Proceedings of IEEE Sensors, IEEE 2004. @conference{wang2004principal,
title = {Principal Discriminants Analysis for small-sample-size problems: application to chemical sensing},
author = {M Wang and A Perera-Lluna and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/wang2004principal.pdf},
year = {2004},
date = {2004-01-01},
booktitle = {Proceedings of IEEE Sensors},
pages = {591-594},
organization = {IEEE},
abstract = {Two dimensionality reduction techniques are widely used to analyze data from chemical sensor arrays: Fisher's linear discriminants analysis (LDA) and principal components analysis (PCA). LDA finds the directions of maximum discrimination in classification problems, but has a tendency to overfit when the ratio of training samples to dimensionality is low, as is commonly the case in chemical sensor array problems. PCA is more robust to overfitting but, being a variance model, fails to capture discriminatory information in low-variance sensors. In this article we propose a hybrid model, termed principal discriminants analysis (PDA), which incorporates both LDA and PCA criteria by means of a regularization parameter. The model is characterized on a synthetic dataset and validated with experimental data from an array of 15 metal-oxide sensors exposed to five varieties of roasted coffee beans. Our results show that PDA provides higher predictive accuracy than LDA or PCA alone. In addition, the model is able to find a trade-off between discriminant- and variance-based projections according to where information is located in the distribution of the data.},
keywords = {Chemical sensors},
pubstate = {published},
tppubtype = {conference}
}
Two dimensionality reduction techniques are widely used to analyze data from chemical sensor arrays: Fisher's linear discriminants analysis (LDA) and principal components analysis (PCA). LDA finds the directions of maximum discrimination in classification problems, but has a tendency to overfit when the ratio of training samples to dimensionality is low, as is commonly the case in chemical sensor array problems. PCA is more robust to overfitting but, being a variance model, fails to capture discriminatory information in low-variance sensors. In this article we propose a hybrid model, termed principal discriminants analysis (PDA), which incorporates both LDA and PCA criteria by means of a regularization parameter. The model is characterized on a synthetic dataset and validated with experimental data from an array of 15 metal-oxide sensors exposed to five varieties of roasted coffee beans. Our results show that PDA provides higher predictive accuracy than LDA or PCA alone. In addition, the model is able to find a trade-off between discriminant- and variance-based projections according to where information is located in the distribution of the data. |
Raman, B; Gutierrez-Galvez, A; Perera-Lluna, A; Gutierrez-Osuna, R Sensor-based machine olfaction with a neurodynamics model of the olfactory bulb Conference Proceedings of IEEE/RSJ International Conference on Intelligent Robots and Systems, IEEE 2004. @conference{raman2004sensor,
title = {Sensor-based machine olfaction with a neurodynamics model of the olfactory bulb},
author = {B Raman and A Gutierrez-Galvez and A Perera-Lluna and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/raman2004sensor.pdf},
year = {2004},
date = {2004-01-01},
booktitle = {Proceedings of IEEE/RSJ International Conference on Intelligent Robots and Systems},
pages = {319--324},
organization = {IEEE},
abstract = {We propose a biologically inspired model of olfactory processing for chemosensor arrays. The model captures three functions in the early olfactory pathway: chemotopic convergence of receptor neurons onto the olfactory bulb, center on-off surround lateral interactions, and adaptation to sustained stimuli. The projection of ORNs onto glomerular units is simulated with a self-organizing model of chemotopic convergence, which leads to odor specific spatial patterning. This information serves as an input to a network of mitral cells with center on-off surround lateral inhibition, which enhances the initial contrast among odors and decouples odor identity from intensity. Finally, slow adaptation of mitral cells adds a temporal dimension to the spatial patterns that further enhances odor discrimination. The model is validated using experimental data from an array of temperature-modulated metal-oxide sensors.},
keywords = {Machine olfaction, Metal-oxide sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {conference}
}
We propose a biologically inspired model of olfactory processing for chemosensor arrays. The model captures three functions in the early olfactory pathway: chemotopic convergence of receptor neurons onto the olfactory bulb, center on-off surround lateral interactions, and adaptation to sustained stimuli. The projection of ORNs onto glomerular units is simulated with a self-organizing model of chemotopic convergence, which leads to odor specific spatial patterning. This information serves as an input to a network of mitral cells with center on-off surround lateral inhibition, which enhances the initial contrast among odors and decouples odor identity from intensity. Finally, slow adaptation of mitral cells adds a temporal dimension to the spatial patterns that further enhances odor discrimination. The model is validated using experimental data from an array of temperature-modulated metal-oxide sensors. |
Rodriguez-Mendez, M L; Arrieta, A; Parra, V; Bernal, A; Vegas, A; Villanueva, S; Gutierrez-Osuna, R; de Saja, J A Fusion of three sensory modalities for the multimodal characterization of red wines Journal Article In: Sensors Journal, IEEE, vol. 4, no. 3, pp. 348–354, 2004. @article{rodrÃguez2004fusion,
title = {Fusion of three sensory modalities for the multimodal characterization of red wines},
author = {M L Rodriguez-Mendez and A Arrieta and V Parra and A Bernal and A Vegas and S Villanueva and R Gutierrez-Osuna and J A de Saja},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/rodrÃguez2004fusion.pdf},
year = {2004},
date = {2004-01-01},
journal = {Sensors Journal, IEEE},
volume = {4},
number = {3},
pages = {348--354},
publisher = {IEEE},
abstract = {This work represents the first attempt to develop a sensory system, specifically designed for the characterization of wines, which combines three sensory modalities: an array of gas sensors, an array of electrochemical liquid sensors, and an optical system to measure color by means of CIElab coordinates. This new analytical tool, that has been called "electronic panel," includes not only sensors, but also hardware (injection system and electronics) and the software necessary for fusing information from the three modules. Each of the three sensory modalities (volatiles, liquids, and color) has been designed, tested, and optimized separately. The discrimination capabilities of the system have been evaluated on a database consisting of six red Spanish wines prepared using the same variety of grape (tempranillo) but differing in their geographic origins and aging stages. Sensor signals from each module have been combined and analyzed using pattern recognition techniques. The results of this work show that the discrimination capabilities of the system are significantly improved when signals from each module are combined to form a multimodal feature vector.},
keywords = {Chemical sensors, Electronic nose},
pubstate = {published},
tppubtype = {article}
}
This work represents the first attempt to develop a sensory system, specifically designed for the characterization of wines, which combines three sensory modalities: an array of gas sensors, an array of electrochemical liquid sensors, and an optical system to measure color by means of CIElab coordinates. This new analytical tool, that has been called "electronic panel," includes not only sensors, but also hardware (injection system and electronics) and the software necessary for fusing information from the three modules. Each of the three sensory modalities (volatiles, liquids, and color) has been designed, tested, and optimized separately. The discrimination capabilities of the system have been evaluated on a database consisting of six red Spanish wines prepared using the same variety of grape (tempranillo) but differing in their geographic origins and aging stages. Sensor signals from each module have been combined and analyzed using pattern recognition techniques. The results of this work show that the discrimination capabilities of the system are significantly improved when signals from each module are combined to form a multimodal feature vector. |
Pasini, P; Powar, N; Gutierrez-Osuna, R; Daunert, S; Roda, A Use of a gas-sensor array for detecting volatile organic compounds (VOC) in chemically induced cells Journal Article In: Analytical and bioanalytical chemistry, vol. 378, no. 1, pp. 76–83, 2004. @article{pasini2004use,
title = {Use of a gas-sensor array for detecting volatile organic compounds (VOC) in chemically induced cells},
author = {P Pasini and N Powar and R Gutierrez-Osuna and S Daunert and A Roda},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/pasini2004use.pdf},
year = {2004},
date = {2004-01-01},
journal = {Analytical and bioanalytical chemistry},
volume = {378},
number = {1},
pages = {76--83},
publisher = {Springer},
abstract = {An application of gas sensors for rapid bioanalysis is presented. An array of temperature-modulated semiconductor sensors was used to characterize the headspace above a cell culture. Recombinant Saccharomyces cerevisiae yeast cells, able to respond to 17β-estradiol by producing a reporter protein, were used as a model system. Yeast cells had the DNA sequence of the human estrogen receptor stably integrated into the genome, and contained expression plasmids carrying estrogen-responsive sequences and the reporter gene lac-Z, encoding the enzyme β-galactosidase. The sensor-response profiles showed small but noticeable discrimination between cell samples induced with 17β-estradiol and non-induced cell samples. The sensor array was capable of detecting changes in the volatile organic compound composition of the headspace above the cultured cells, which can be associated with metabolic changes induced by a chemical compound. This finding suggests the possibility of using cross-selective gas-sensor arrays for analysis of drugs or bioactive molecules through their interaction with cell systems, with the advantage of providing information on their bioavailability.},
keywords = {Chemical sensors, Metal-oxide sensors, Temperature modulation},
pubstate = {published},
tppubtype = {article}
}
An application of gas sensors for rapid bioanalysis is presented. An array of temperature-modulated semiconductor sensors was used to characterize the headspace above a cell culture. Recombinant Saccharomyces cerevisiae yeast cells, able to respond to 17β-estradiol by producing a reporter protein, were used as a model system. Yeast cells had the DNA sequence of the human estrogen receptor stably integrated into the genome, and contained expression plasmids carrying estrogen-responsive sequences and the reporter gene lac-Z, encoding the enzyme β-galactosidase. The sensor-response profiles showed small but noticeable discrimination between cell samples induced with 17β-estradiol and non-induced cell samples. The sensor array was capable of detecting changes in the volatile organic compound composition of the headspace above the cultured cells, which can be associated with metabolic changes induced by a chemical compound. This finding suggests the possibility of using cross-selective gas-sensor arrays for analysis of drugs or bioactive molecules through their interaction with cell systems, with the advantage of providing information on their bioavailability. |
Raman, B; Gutierrez-Osuna, R Chemosensory processing in a spiking model of the olfactory bulb: chemotopic convergence and center surround inhibition Conference NIPS, 2004. @conference{raman2004chemosensory,
title = {Chemosensory processing in a spiking model of the olfactory bulb: chemotopic convergence and center surround inhibition},
author = {B Raman and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/raman2004chemosensory.pdf},
year = {2004},
date = {2004-01-01},
booktitle = {NIPS},
abstract = {This paper presents a neuromorphic model of two olfactory signalprocessing primitives: chemotopic convergence of olfactory receptor neurons, and center on-off surround lateral inhibition in the olfactory bulb. A self-organizing model of receptor convergence onto glomeruli is used to generate a spatially organized map, an olfactory image. This map serves as input to a lattice of spiking neurons with lateral connections. The dynamics of this recurrent network transforms the initial olfactory image into a spatio-temporal pattern that evolves and stabilizes into odor- and intensity-coding attractors. The model is validated using experimental data from an array of temperature-modulated gas sensors. Our results are consistent with recent neurobiological findings on the antennal lobe of the honeybee and the locust.},
keywords = {Neuromorphic models},
pubstate = {published},
tppubtype = {conference}
}
This paper presents a neuromorphic model of two olfactory signalprocessing primitives: chemotopic convergence of olfactory receptor neurons, and center on-off surround lateral inhibition in the olfactory bulb. A self-organizing model of receptor convergence onto glomeruli is used to generate a spatially organized map, an olfactory image. This map serves as input to a lattice of spiking neurons with lateral connections. The dynamics of this recurrent network transforms the initial olfactory image into a spatio-temporal pattern that evolves and stabilizes into odor- and intensity-coding attractors. The model is validated using experimental data from an array of temperature-modulated gas sensors. Our results are consistent with recent neurobiological findings on the antennal lobe of the honeybee and the locust. |
Gutierrez-Osuna, R Olfactory Interaction Book Chapter In: Encyclopedia of Human-Computer Interaction, pp. 507-511, Berkshire Publishing Group, 2004. @inbook{gutierrez04interaction,
title = {Olfactory Interaction},
author = {R Gutierrez-Osuna},
year = {2004},
date = {2004-01-01},
booktitle = {Encyclopedia of Human-Computer Interaction},
pages = {507-511},
publisher = {Berkshire Publishing Group},
keywords = {Olfaction},
pubstate = {published},
tppubtype = {inbook}
}
|
2003
|
Florkey, L; Gutierrez-Osuna, R; Bullock, J D Computer-Aided Pattern Recognition in the Classification of Superficial Corneal Injuries Conference Proceedings of the Annual Meeting of the American Academy of Optometry, 2003. @conference{florkey03corneal,
title = {Computer-Aided Pattern Recognition in the Classification of Superficial Corneal Injuries},
author = {L Florkey and R Gutierrez-Osuna and J D Bullock},
year = {2003},
date = {2003-12-04},
booktitle = {Proceedings of the Annual Meeting of the American Academy of Optometry},
keywords = {Pattern recognition},
pubstate = {published},
tppubtype = {conference}
}
|
Pasini, P; Powar, N; Gutierrez-Osuna, R; Daunert, S; Roda, A Use of an electronic nose for the identification of genetically modified organisms Conference Proceedings of the 21st National Congress of the Italian Chemical Society, 2003. @conference{pasini03use,
title = {Use of an electronic nose for the identification of genetically modified organisms},
author = {P Pasini and N Powar and R Gutierrez-Osuna and S Daunert and A Roda},
year = {2003},
date = {2003-06-22},
booktitle = {Proceedings of the 21st National Congress of the Italian Chemical Society},
keywords = {Electronic nose},
pubstate = {published},
tppubtype = {conference}
}
|
Gutierrez-Osuna, R; Gutierrez-Galvez, A Habituation in the KIII olfactory model with chemical sensor arrays Journal Article In: Neural Networks, IEEE Transactions on, vol. 14, no. 6, pp. 1565–1568, 2003. @article{gutierrez2003habituation,
title = {Habituation in the KIII olfactory model with chemical sensor arrays},
author = {R Gutierrez-Osuna and A Gutierrez-Galvez},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2003habituation.pdf},
year = {2003},
date = {2003-01-01},
journal = {Neural Networks, IEEE Transactions on},
volume = {14},
number = {6},
pages = {1565--1568},
publisher = {IEEE},
abstract = {This paper presents a novel combination of chemical sensors and the KIII model for simulating mixture perception with a habituation process triggered by local activity. Stimuli are generated by partitioning feature space with labeled lines. Pattern completion is demonstrated through coherent oscillations across granule populations using experimental odor mixtures.},
keywords = {Chemical sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {article}
}
This paper presents a novel combination of chemical sensors and the KIII model for simulating mixture perception with a habituation process triggered by local activity. Stimuli are generated by partitioning feature space with labeled lines. Pattern completion is demonstrated through coherent oscillations across granule populations using experimental odor mixtures. |
Mousavi, M J; Butler-Purry, K L; Gutierrez-Osuna, R; Najafi, M Classification of load change transients and incipient abnormalities in underground cable using pattern analysis techniques Conference Proceedings of 2003 IEEE PES Transmission and Distribution Conference and Exposition, IEEE 2003. @conference{mousavi2003classification,
title = {Classification of load change transients and incipient abnormalities in underground cable using pattern analysis techniques},
author = {M J Mousavi and K L Butler-Purry and R Gutierrez-Osuna and M Najafi},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/mousavi2003tdce.pdf},
year = {2003},
date = {2003-01-01},
booktitle = {Proceedings of 2003 IEEE PES Transmission and Distribution Conference and Exposition},
pages = {175--180},
organization = {IEEE},
abstract = {This paper presents a feasibility study on the application of pattern analysis techniques to classify load change transients and incipient abnormalities in an underground distribution cable lateral. The data were collected using an on-line monitoring system installed in a residential area in Dallas. A set of features obtained from wavelet packet analysis was evaluated. Methods of dimensionality reduction were employed to overcome the curse of dimensionality while preserving a good classification rate. The classification results using k-nearest-neighbor (KNN) classifiers show that the proposed methodology can be used to classify load change transients and incipient abnormalities.},
keywords = {Pattern recognition},
pubstate = {published},
tppubtype = {conference}
}
This paper presents a feasibility study on the application of pattern analysis techniques to classify load change transients and incipient abnormalities in an underground distribution cable lateral. The data were collected using an on-line monitoring system installed in a residential area in Dallas. A set of features obtained from wavelet packet analysis was evaluated. Methods of dimensionality reduction were employed to overcome the curse of dimensionality while preserving a good classification rate. The classification results using k-nearest-neighbor (KNN) classifiers show that the proposed methodology can be used to classify load change transients and incipient abnormalities. |
Gutierrez-Osuna, R; Gutierrez-Galvez, A; Powar, N Transient response analysis for temperature-modulated chemoresistors Journal Article In: Sensors and Actuators B: Chemical, vol. 93, no. 1-3, pp. 57–66, 2003. @article{gutierrez2003transient,
title = {Transient response analysis for temperature-modulated chemoresistors},
author = {R Gutierrez-Osuna and A Gutierrez-Galvez and N Powar},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2003transient.pdf},
year = {2003},
date = {2003-01-01},
journal = {Sensors and Actuators B: Chemical},
volume = {93},
number = {1-3},
pages = {57--66},
publisher = {Elsevier},
abstract = {This article presents a sensor excitation and signal processing approach that combines temperature modulation and transientanalysis to enhance the selectivity and sensitivity of metal-oxide gas sensors. A staircase waveform is applied to the sensor heater to extract transient information from multiple operating temperatures. Four different transientanalysis techniques, Pade–Z-transform, multi-exponential transient spectroscopy (METS), window time slicing (WTS) and a novel ridge regression solution, are evaluated on the basis of their ability to improve the sensitivity and selectivity of the sensor array. The techniques are validated on two experimental databases containing serial dilutions and mixtures of organic solvents. Our results indicate that processing of the thermal transients significantly improves the sensitivity of metal-oxide chemoresistors when compared to the quasi-stationary temperature-modulatedresponses.},
keywords = {Chemical sensors, Metal-oxide sensors, Temperature modulation},
pubstate = {published},
tppubtype = {article}
}
This article presents a sensor excitation and signal processing approach that combines temperature modulation and transientanalysis to enhance the selectivity and sensitivity of metal-oxide gas sensors. A staircase waveform is applied to the sensor heater to extract transient information from multiple operating temperatures. Four different transientanalysis techniques, Pade–Z-transform, multi-exponential transient spectroscopy (METS), window time slicing (WTS) and a novel ridge regression solution, are evaluated on the basis of their ability to improve the sensitivity and selectivity of the sensor array. The techniques are validated on two experimental databases containing serial dilutions and mixtures of organic solvents. Our results indicate that processing of the thermal transients significantly improves the sensitivity of metal-oxide chemoresistors when compared to the quasi-stationary temperature-modulatedresponses. |
Gutierrez-Galvez, A; Gutierrez-Osuna, R Pattern completion through phase coding in population neurodynamics Journal Article In: Neural networks, vol. 16, no. 5-6, pp. 649–656, 2003. @article{gutierrez2003pattern,
title = {Pattern completion through phase coding in population neurodynamics},
author = {A Gutierrez-Galvez and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2003pattern.pdf},
year = {2003},
date = {2003-01-01},
journal = {Neural networks},
volume = {16},
number = {5-6},
pages = {649--656},
publisher = {Elsevier},
abstract = {This article presents an alternative phasecoding mechanism for Freeman's KIII model of populationneurodynamics. Motivated by experimental evidence that supports the existence of a neural code based on synchronous oscillations, we propose an analogy between synchronization in neural populations and phase locking in KIII channels. An efficient method is proposed to extract phase differences across granule channels from their state-space trajectories. First, the scale invariance of the KIII model with respect to phase information is established. The phase code is then compared against the conventional amplitude code in terms of their bit-wise and across-fiber pattern recovery capabilities using decision-theoretic principles and a Hamming-distance classifier. Graph isomorphism in the Hebbian connections is exploited to perform an exhaustive evaluation of patterns on an 8-channel KIII model. Simulation results show that phase information outperforms amplitude information in the recovery of incomplete or corrupted stimuli.},
keywords = {Neuromorphic models},
pubstate = {published},
tppubtype = {article}
}
This article presents an alternative phasecoding mechanism for Freeman's KIII model of populationneurodynamics. Motivated by experimental evidence that supports the existence of a neural code based on synchronous oscillations, we propose an analogy between synchronization in neural populations and phase locking in KIII channels. An efficient method is proposed to extract phase differences across granule channels from their state-space trajectories. First, the scale invariance of the KIII model with respect to phase information is established. The phase code is then compared against the conventional amplitude code in terms of their bit-wise and across-fiber pattern recovery capabilities using decision-theoretic principles and a Hamming-distance classifier. Graph isomorphism in the Hebbian connections is exploited to perform an exhaustive evaluation of patterns on an 8-channel KIII model. Simulation results show that phase information outperforms amplitude information in the recovery of incomplete or corrupted stimuli. |
Gutierrez-Galvez, A; Gutierrez-Osuna, R Coherent oscillations as a neural code in a model of the olfactory system Conference Proceedings of the International Joint Conference on Neural Networks, IEEE 2003. @conference{gutierrez2003coherent,
title = {Coherent oscillations as a neural code in a model of the olfactory system},
author = {A Gutierrez-Galvez and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2003coherent.pdf},
year = {2003},
date = {2003-01-01},
booktitle = {Proceedings of the International Joint Conference on Neural Networks},
pages = {341--346},
organization = {IEEE},
abstract = {This paper presents an investigation of two odor-coding mechanisms in Freeman's KIII neurodynamics model. Motivated by experimental evidence that supports the existence of a neural code based on synchronous oscillations, we propose an analogy between synchronization in neural populations and phase locking in KIII channels. The information carried by the phase is compared against the conventional amplitude code in terms of pattern-recovery capabilities. First, the scalar invariance of the KIII with respect to phase information is established. Symmetries and redundancies in the associative memory matrices are then exploited to perform an exhaustive evaluation of patterns on an 8-channel model. Simulation results show that phase information outperforms amplitude information in the recovery of odor patterns from incomplete or corrupted sensory stimulus.},
keywords = {Neuromorphic models},
pubstate = {published},
tppubtype = {conference}
}
This paper presents an investigation of two odor-coding mechanisms in Freeman's KIII neurodynamics model. Motivated by experimental evidence that supports the existence of a neural code based on synchronous oscillations, we propose an analogy between synchronization in neural populations and phase locking in KIII channels. The information carried by the phase is compared against the conventional amplitude code in terms of pattern-recovery capabilities. First, the scalar invariance of the KIII with respect to phase information is established. Symmetries and redundancies in the associative memory matrices are then exploited to perform an exhaustive evaluation of patterns on an 8-channel model. Simulation results show that phase information outperforms amplitude information in the recovery of odor patterns from incomplete or corrupted sensory stimulus. |
Bryll, R; Gutierrez-Osuna, R; Quek, F Attribute bagging: improving accuracy of classifier ensembles by using random feature subsets Journal Article In: Pattern Recognition, vol. 36, no. 6, pp. 1291–1302, 2003. @article{bryll2003attribute,
title = {Attribute bagging: improving accuracy of classifier ensembles by using random feature subsets},
author = {R Bryll and R Gutierrez-Osuna and F Quek},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/bryll2003attribute-1.pdf},
year = {2003},
date = {2003-01-01},
journal = {Pattern Recognition},
volume = {36},
number = {6},
pages = {1291--1302},
publisher = {Elsevier},
abstract = {We present attribute bagging (AB), a technique for improving the accuracy and stability ofclassifierensembles induced using randomsubsets of features. AB is a wrapper method that can be used with any learning algorithm. It establishes an appropriate attributesubset size and then randomly selectssubsets of features, creating projections of the training set on which the ensembleclassifiers are built. The induced classifiers are then used for voting. This article compares the performance of our AB method with bagging and other algorithms on a hand-pose recognition dataset. It is shown that AB gives consistently better results than bagging, both in accuracy and stability. The performance of ensemble voting in bagging and the AB method as a function of the attributesubset size and the number of voters for both weighted and unweighted voting is tested and discussed. We also demonstrate that ranking the attributesubsets by their classification accuracy and voting using only the best subsets further improves the resulting performance of the ensemble.},
keywords = {Pattern recognition},
pubstate = {published},
tppubtype = {article}
}
We present attribute bagging (AB), a technique for improving the accuracy and stability ofclassifierensembles induced using randomsubsets of features. AB is a wrapper method that can be used with any learning algorithm. It establishes an appropriate attributesubset size and then randomly selectssubsets of features, creating projections of the training set on which the ensembleclassifiers are built. The induced classifiers are then used for voting. This article compares the performance of our AB method with bagging and other algorithms on a hand-pose recognition dataset. It is shown that AB gives consistently better results than bagging, both in accuracy and stability. The performance of ensemble voting in bagging and the AB method as a function of the attributesubset size and the number of voters for both weighted and unweighted voting is tested and discussed. We also demonstrate that ranking the attributesubsets by their classification accuracy and voting using only the best subsets further improves the resulting performance of the ensemble. |
Courte, D E; Rizki, M M; Tamburino, L A; Gutierrez-Osuna, R Evolutionary optimization of Gaussian windowing functions for data preprocessing Journal Article In: International Journal on Artificial Intelligence Tools, vol. 12, no. 1, pp. 17–36, 2003. @article{courte2003evolutionary,
title = {Evolutionary optimization of Gaussian windowing functions for data preprocessing},
author = {D E Courte and M M Rizki and L A Tamburino and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/courte2003evolutionary-1.pdf},
year = {2003},
date = {2003-01-01},
journal = {International Journal on Artificial Intelligence Tools},
volume = {12},
number = {1},
pages = {17--36},
publisher = {WORLD SCIENTIFIC PUBLISHING},
abstract = {The average classification accuracy of an odor classification system is improved using a genetic algorithm to determine optimal parameters for feature extraction. Gaussian windowing functions, called "kernels" are evolved to extract information from the transient response of an array of gas sensors, resulting in a reduced set of extracted features for a linear discriminant pattern classification system. Results show significant improvements are achieved when compared to results obtained using a predetermined and fixed set of four bell-shaped kernels for every sensor. Examination of the evolved kernels reveals the areas of the sensor responses where discriminating information was identified. A novel data migration approach during training helps prevent overtraining, and the fitness measure chosen incorporates adjustments for both population diversity and solution complexity. A variety of adjustable parameters, including the definition of a time-varying dynamic weighting factor, encourage experimentation in order to appropriately tune the sampling methods and fitness measure.},
keywords = {Electronic nose, Pattern recognition},
pubstate = {published},
tppubtype = {article}
}
The average classification accuracy of an odor classification system is improved using a genetic algorithm to determine optimal parameters for feature extraction. Gaussian windowing functions, called "kernels" are evolved to extract information from the transient response of an array of gas sensors, resulting in a reduced set of extracted features for a linear discriminant pattern classification system. Results show significant improvements are achieved when compared to results obtained using a predetermined and fixed set of four bell-shaped kernels for every sensor. Examination of the evolved kernels reveals the areas of the sensor responses where discriminating information was identified. A novel data migration approach during training helps prevent overtraining, and the fitness measure chosen incorporates adjustments for both population diversity and solution complexity. A variety of adjustable parameters, including the definition of a time-varying dynamic weighting factor, encourage experimentation in order to appropriately tune the sampling methods and fitness measure. |
Gutierrez-Osuna, R; Powar, N Odor mixtures and chemosensory adaptation in gas sensor arrays Journal Article In: International Journal on Artificial Intelligence Tools, vol. 12, no. 1, pp. 1–16, 2003. @article{gutierrez2003odor,
title = {Odor mixtures and chemosensory adaptation in gas sensor arrays},
author = {R Gutierrez-Osuna and N Powar},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2003odor.pdf},
year = {2003},
date = {2003-01-01},
journal = {International Journal on Artificial Intelligence Tools},
volume = {12},
number = {1},
pages = {1--16},
publisher = {WORLD SCIENTIFIC PUBLISHING},
abstract = {Inspired by the process of olfactory adaptation in biological olfactory systems, this article presents two algorithms that allow a chemical sensor array to reduce its sensitivity to odors previously detected in the environment. The first algorithm is based on a committee machine of linear discriminant functions that operate on multiple subsets of the overall sensory input. Adaptation occurs by depressing the voting strength of discriminant functions that display higher sensitivity to previously detected odors. The second algorithm is based on a topology-preserving linear projection derived from Fisher's class separability criteria. In this case, the process of adaptation is implemented through a reformulation of the between-to-within-class scatter eigenvalue problem. The proposed algorithms are validated on two datasets of binary and ternary mixtures of organic solvents using an array of temperature-modulated metal-oxide chemoresistors.},
keywords = {Metal-oxide sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {article}
}
Inspired by the process of olfactory adaptation in biological olfactory systems, this article presents two algorithms that allow a chemical sensor array to reduce its sensitivity to odors previously detected in the environment. The first algorithm is based on a committee machine of linear discriminant functions that operate on multiple subsets of the overall sensory input. Adaptation occurs by depressing the voting strength of discriminant functions that display higher sensitivity to previously detected odors. The second algorithm is based on a topology-preserving linear projection derived from Fisher's class separability criteria. In this case, the process of adaptation is implemented through a reformulation of the between-to-within-class scatter eigenvalue problem. The proposed algorithms are validated on two datasets of binary and ternary mixtures of organic solvents using an array of temperature-modulated metal-oxide chemoresistors. |
Gudmundsson, K S; Awwal, A A S; Gutierrez-Osuna, R Application of phase only filters on e-nose data Conference SPIE Conference (Photonic Devices and Algorithms for Computing V), 2003. @conference{gudmundsson03phase,
title = {Application of phase only filters on e-nose data},
author = {K S Gudmundsson and A A S Awwal and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gudmundsson2003application-1.pdf},
year = {2003},
date = {2003-01-01},
booktitle = {SPIE Conference (Photonic Devices and Algorithms for Computing V)},
abstract = {A system composed of multiple sensors for data acquisition requires the analysis of multiple data signals in order to classify the input data. One such system is the electronic nose system (eNose). The eNose data is in fact 1D data from multiple data sources. However, in order to analyze and classify such data using conventional methods such as Linear Discriminant Analysis (LDA), Principal Component Analysis (PCA), or the K Nearest Neighbors (KNN) requires much computational power. In this research data from such system will be analyzed and classified using the POF.},
keywords = {Electronic nose},
pubstate = {published},
tppubtype = {conference}
}
A system composed of multiple sensors for data acquisition requires the analysis of multiple data signals in order to classify the input data. One such system is the electronic nose system (eNose). The eNose data is in fact 1D data from multiple data sources. However, in order to analyze and classify such data using conventional methods such as Linear Discriminant Analysis (LDA), Principal Component Analysis (PCA), or the K Nearest Neighbors (KNN) requires much computational power. In this research data from such system will be analyzed and classified using the POF. |
2002
|
Nagle, H T; Gutierrez-Osuna, R; Kermani, B; Schiffman, S S Environmental monitoring Book Chapter In: Handbook of Machine Olfaction, pp. 419–444, Wiley Online Library, 2002. @inbook{nagle2003environmental,
title = {Environmental monitoring},
author = {H T Nagle and R Gutierrez-Osuna and B Kermani and S S Schiffman},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/nagle2003environmental.pdf},
year = {2002},
date = {2002-01-01},
booktitle = {Handbook of Machine Olfaction},
pages = {419--444},
publisher = {Wiley Online Library},
abstract = {In this chapter, we review some of the previous proof-of-principle work done in this field. Examples of water, land and air monitoring experiments are examined. Four case studies are then presented. The first three demonstrate the ability of the e-nose to classify odors from animal confinement facilities (odor source determination, odorant threshold detection, and odor abatement evaluation). The fourth case study demonstrates that the e-nose can differentiate between five types of fungi that commonly lower indoor air quality in office buildings and industrial plants. Finally, we conclude that environmental monitoring is a promising application area for electronic nose technology.},
keywords = {Machine olfaction},
pubstate = {published},
tppubtype = {inbook}
}
In this chapter, we review some of the previous proof-of-principle work done in this field. Examples of water, land and air monitoring experiments are examined. Four case studies are then presented. The first three demonstrate the ability of the e-nose to classify odors from animal confinement facilities (odor source determination, odorant threshold detection, and odor abatement evaluation). The fourth case study demonstrates that the e-nose can differentiate between five types of fungi that commonly lower indoor air quality in office buildings and industrial plants. Finally, we conclude that environmental monitoring is a promising application area for electronic nose technology. |
Schiffman, S S; Gutierrez-Osuna, R; Nagle, H T Measuring odor intensity with e-noses and other sensor types Conference Proceedings of the 9th International Symposium on Olfaction and Electronic Nose, 2002. @conference{schiffman2002measuring,
title = {Measuring odor intensity with e-noses and other sensor types},
author = {S S Schiffman and R Gutierrez-Osuna and H T Nagle},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/schiffman2002measuring.pdf},
year = {2002},
date = {2002-01-01},
booktitle = {Proceedings of the 9th International Symposium on Olfaction and Electronic Nose},
pages = {68--72},
abstract = {This paper addresses the problem of predicting human olfactory ratings from instrumental measurements. Specifically, the paper analyzes the ability of two commercially-available electronic nose instruments (the NST 3320 and the Cyranose® 320) and three other sensing devices (a photoionization detector, a gold-film sulfur sensor, and an infrared laser detector) to match the performance of the human olfactory system in measuring odor intensity in a variety of realistic situations. These initial studies offer encouraging results for the two e-nose instruments, the PID, and the Au-film sensor.},
keywords = {Electronic nose},
pubstate = {published},
tppubtype = {conference}
}
This paper addresses the problem of predicting human olfactory ratings from instrumental measurements. Specifically, the paper analyzes the ability of two commercially-available electronic nose instruments (the NST 3320 and the Cyranose® 320) and three other sensing devices (a photoionization detector, a gold-film sulfur sensor, and an infrared laser detector) to match the performance of the human olfactory system in measuring odor intensity in a variety of realistic situations. These initial studies offer encouraging results for the two e-nose instruments, the PID, and the Au-film sensor. |
Gutierrez-Osuna, R; Gutierrez-Galvez, A Habituation in the KIII olfactory model using gas sensor arrays Conference Proceedings of the 9th International Symposium on Olfaction and Electronic Nose, 2002. @conference{gutierrez2002habituation,
title = {Habituation in the KIII olfactory model using gas sensor arrays},
author = {R Gutierrez-Osuna and A Gutierrez-Galvez},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2002habituation.pdf},
year = {2002},
date = {2002-01-01},
booktitle = {Proceedings of the 9th International Symposium on Olfaction and Electronic Nose},
pages = {171--173},
abstract = {Inspired by the habituation process in the olfactory system, this article presents an approach for analyzing electronic-nose data using Freeman’s KIII neurodynamics model. In order to ensure the additivity of patterns from odor mixtures, input data from a gas sensor array is first processed with a family of discriminant functions that yield an orthogonal binary representation. The process of habituation is then simulated through synaptic depression with a decay term that reduces the strength of mitral and granule connections when the KIII model is excited with a continuous stimulus. As a result, the system is able to mimic the effects of habituation when processing odor mixtures with gas sensor arrays.},
keywords = {Metal-oxide sensors, Neuromorphic models},
pubstate = {published},
tppubtype = {conference}
}
Inspired by the habituation process in the olfactory system, this article presents an approach for analyzing electronic-nose data using Freeman’s KIII neurodynamics model. In order to ensure the additivity of patterns from odor mixtures, input data from a gas sensor array is first processed with a family of discriminant functions that yield an orthogonal binary representation. The process of habituation is then simulated through synaptic depression with a decay term that reduces the strength of mitral and granule connections when the KIII model is excited with a continuous stimulus. As a result, the system is able to mimic the effects of habituation when processing odor mixtures with gas sensor arrays. |
Gutierrez-Osuna, R; Sun, P A biologically-plausible computational architecture for sensor-based machine olfaction Conference Proceedings of the ninth International Symposium on Olfaction and Electronic Nose, 2002. @conference{gutierrez2002biologically,
title = {A biologically-plausible computational architecture for sensor-based machine olfaction},
author = {R Gutierrez-Osuna and P Sun},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2002biologically.pdf},
year = {2002},
date = {2002-01-01},
booktitle = {Proceedings of the ninth International Symposium on Olfaction and Electronic Nose},
pages = {57--59},
abstract = {This article presents a computational architecture for sensor-based machine olfaction based on biologically plausible models of the early stages in the olfactory pathway. We derive a concentration-response model that maps conventional sensor-array patterns into activation patterns for a population of olfactory receptor neurons (ORNs). A chemotopic convergence model is employed to generate spatial activation patterns at the glomerular layer that are consistent with neurobiology. These glomerular images serve as inputs to an implementation of Freeman’s KIII neurodynamics model.},
keywords = {Machine olfaction, Neuromorphic models},
pubstate = {published},
tppubtype = {conference}
}
This article presents a computational architecture for sensor-based machine olfaction based on biologically plausible models of the early stages in the olfactory pathway. We derive a concentration-response model that maps conventional sensor-array patterns into activation patterns for a population of olfactory receptor neurons (ORNs). A chemotopic convergence model is employed to generate spatial activation patterns at the glomerular layer that are consistent with neurobiology. These glomerular images serve as inputs to an implementation of Freeman’s KIII neurodynamics model. |
Perera-Lluna, A; Sundic, T; Pardo, A; Gutierrez-Osuna, R; Marco, S A portable electronic nose based on embedded PC technology and GNU/Linux: Hardware, software and applications Journal Article In: Sensors Journal, IEEE, vol. 2, no. 3, pp. 235–246, 2002. @article{perera2002portable,
title = {A portable electronic nose based on embedded PC technology and GNU/Linux: Hardware, software and applications},
author = {A Perera-Lluna and T Sundic and A Pardo and R Gutierrez-Osuna and S Marco},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/perera2002portable.pdf},
year = {2002},
date = {2002-01-01},
journal = {Sensors Journal, IEEE},
volume = {2},
number = {3},
pages = {235--246},
publisher = {IEEE},
abstract = {This paper describes a portable electronic nose based on embedded PC technology. The instrument combines a small footprint with the versatility offered by embedded technology in terms of software development and digital communications services. A summary of the proposed hardware and software solutions is provided with an emphasis on data processing. Data evaluation procedures available in the instrument include automatic feature selection by means of SFFS, feature extraction with linear discriminant analysis (LDA) and principal component analysis (PCA), multi-component analysis with partial least squares (PLS) and classification through k-NN and Gaussian mixture models. In terms of instrumentation, the instrument makes use of temperature modulation to improve the selectivity of commercial metal oxide gas sensors. Field applications of the instrument, including experimental results, are also presented.},
keywords = {Electronic nose, Metal-oxide sensors},
pubstate = {published},
tppubtype = {article}
}
This paper describes a portable electronic nose based on embedded PC technology. The instrument combines a small footprint with the versatility offered by embedded technology in terms of software development and digital communications services. A summary of the proposed hardware and software solutions is provided with an emphasis on data processing. Data evaluation procedures available in the instrument include automatic feature selection by means of SFFS, feature extraction with linear discriminant analysis (LDA) and principal component analysis (PCA), multi-component analysis with partial least squares (PLS) and classification through k-NN and Gaussian mixture models. In terms of instrumentation, the instrument makes use of temperature modulation to improve the selectivity of commercial metal oxide gas sensors. Field applications of the instrument, including experimental results, are also presented. |
Gutierrez-Osuna, R Pattern analysis for machine olfaction: a review Journal Article In: Sensors Journal, IEEE, vol. 2, no. 3, pp. 189–202, 2002. @article{gutierrezosuna2002sj,
title = {Pattern analysis for machine olfaction: a review},
author = {R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrezosuna2002sj.pdf},
year = {2002},
date = {2002-01-01},
journal = {Sensors Journal, IEEE},
volume = {2},
number = {3},
pages = {189--202},
publisher = {IEEE},
abstract = {Pattern analysis constitutes a critical building block in the development of gas sensor array instruments capable of detecting, identifying, and measuring volatile compounds, a technology that has been proposed as an artificial substitute for the human olfactory system. The successful design of a pattern analysis system for machine olfaction requires a careful consideration of the various issues involved in processing multivariate data: signal-preprocessing, feature extraction, feature selection, classification, regression, clustering, and validation. A considerable number of methods from statistical pattern recognition, neural networks, chemometrics, machine learning, and biological cybernetics have been used to process electronic nose data. The objective of this review paper is to provide a summary and guidelines for using the most widely used pattern analysis techniques, as well as to identify research directions that are at the frontier of sensor-based machine olfaction.},
keywords = {Machine olfaction},
pubstate = {published},
tppubtype = {article}
}
Pattern analysis constitutes a critical building block in the development of gas sensor array instruments capable of detecting, identifying, and measuring volatile compounds, a technology that has been proposed as an artificial substitute for the human olfactory system. The successful design of a pattern analysis system for machine olfaction requires a careful consideration of the various issues involved in processing multivariate data: signal-preprocessing, feature extraction, feature selection, classification, regression, clustering, and validation. A considerable number of methods from statistical pattern recognition, neural networks, chemometrics, machine learning, and biological cybernetics have been used to process electronic nose data. The objective of this review paper is to provide a summary and guidelines for using the most widely used pattern analysis techniques, as well as to identify research directions that are at the frontier of sensor-based machine olfaction. |
Gutierrez-Osuna, R A self-organizing model of chemotopic convergence for olfactory coding Conference Proceedings of the 2nd Joint EMBS-BMES Conference, vol. 1, IEEE 2002. @conference{gutierrez2002self,
title = {A self-organizing model of chemotopic convergence for olfactory coding},
author = {R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2002self.pdf},
year = {2002},
date = {2002-01-01},
booktitle = {Proceedings of the 2nd Joint EMBS-BMES Conference},
volume = {1},
pages = {236--237},
organization = {IEEE},
abstract = {Presents a self-organizing model of convergence for the early stages of the olfactory pathway. The model generates a chemotopic projection from olfactory receptor neurons onto glomeruli based on receptor affinity distributions. The resulting glomerular images reveal an olfactory code consistent with neurobiology, whereby odor quality is encoded by a unique spatial pattern across glomeruli, and odor concentration is related to the intensity and spread of this pattern. The model is also able to predict a broadening of the intensity tuning range of glomeruli.},
keywords = {Neuromorphic models},
pubstate = {published},
tppubtype = {conference}
}
Presents a self-organizing model of convergence for the early stages of the olfactory pathway. The model generates a chemotopic projection from olfactory receptor neurons onto glomeruli based on receptor affinity distributions. The resulting glomerular images reveal an olfactory code consistent with neurobiology, whereby odor quality is encoded by a unique spatial pattern across glomeruli, and odor concentration is related to the intensity and spread of this pattern. The model is also able to predict a broadening of the intensity tuning range of glomeruli. |
Gutierrez-Osuna, R; Nagle, H T; Kermani, B; Schiffman, S S Signal conditioning and preprocessing Book Chapter In: Handbook of Machine Olfaction, pp. 105–132, Wiley Online Library, 2002. @inbook{gutierrez2002signal,
title = {Signal conditioning and preprocessing},
author = {R Gutierrez-Osuna and H T Nagle and B Kermani and S S Schiffman},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2002signal.pdf},
year = {2002},
date = {2002-01-01},
booktitle = {Handbook of Machine Olfaction},
pages = {105--132},
publisher = {Wiley Online Library},
abstract = {The topics covered in this chapter establish the connection between gas sensors and pattern recognition, the two fundamental modules of an odor-sensing instrument that are covered in Chapters 6 and 8, respectively. A number of electronic circuits are involved in integrating pattern analysis algorithms with the underlying chemical transduction mechanisms, as shown in Figure 1. First, the response of the odor sensors (e.g. a resistance change) needs to be measured and converted into an electrical signal (e.g. a voltage). This operation is performed by means of interface circuits. Second, the electrical signal undergoes analog conditioning (e.g. filtering) to enhance its information content. Third, the analog signal is sampled, digitized and stored in computer memory (not covered in this chapter due to space constraints). Finally, the sampled signal is digitally pre-processed (e.g. autoscaling) in order to make it suitable for pattern analysis. This chapter is organized in three basic parts: interface circuits, signal conditioning and preprocessing. Section 2 presents the fundamental interface circuits for the three primary odor sensor types: resistive, piezoelectric and field-effect. Section 3 reviews the primary functions performed by analog signal conditioning circuits. Section 4 covers data pre-processing, the first stage of digital signal processing. The issue of sensor and instrumentation noise, one of the most important factors determining electronic-nose performance, is also reviewed in section 5. The chapter concludes with a review of current instrumentation trends aimed at increasing the selectivity of odor sensor systems.},
keywords = {Machine olfaction},
pubstate = {published},
tppubtype = {inbook}
}
The topics covered in this chapter establish the connection between gas sensors and pattern recognition, the two fundamental modules of an odor-sensing instrument that are covered in Chapters 6 and 8, respectively. A number of electronic circuits are involved in integrating pattern analysis algorithms with the underlying chemical transduction mechanisms, as shown in Figure 1. First, the response of the odor sensors (e.g. a resistance change) needs to be measured and converted into an electrical signal (e.g. a voltage). This operation is performed by means of interface circuits. Second, the electrical signal undergoes analog conditioning (e.g. filtering) to enhance its information content. Third, the analog signal is sampled, digitized and stored in computer memory (not covered in this chapter due to space constraints). Finally, the sampled signal is digitally pre-processed (e.g. autoscaling) in order to make it suitable for pattern analysis. This chapter is organized in three basic parts: interface circuits, signal conditioning and preprocessing. Section 2 presents the fundamental interface circuits for the three primary odor sensor types: resistive, piezoelectric and field-effect. Section 3 reviews the primary functions performed by analog signal conditioning circuits. Section 4 covers data pre-processing, the first stage of digital signal processing. The issue of sensor and instrumentation noise, one of the most important factors determining electronic-nose performance, is also reviewed in section 5. The chapter concludes with a review of current instrumentation trends aimed at increasing the selectivity of odor sensor systems. |
Rodríguez-Méndez, M L; Arrieta, A; Parra, V; Vegas, A; Villanueva, S; Gutierrez-Osuna, R; de Saja, J A Sensor system for the complete organoleptic characterization (smell, taste and color) of wines Conference Proceedings of the 9th International Symposium on Olfaction and Electronic Nose, 2002. @conference{mendez01organoleptic,
title = {Sensor system for the complete organoleptic characterization (smell, taste and color) of wines},
author = {M L Rodríguez-Méndez and A Arrieta and V Parra and A Vegas and S Villanueva and R Gutierrez-Osuna and J A de Saja},
year = {2002},
date = {2002-01-01},
booktitle = {Proceedings of the 9th International Symposium on Olfaction and Electronic Nose},
keywords = {Chemical sensors},
pubstate = {published},
tppubtype = {conference}
}
|
Gutierrez-Osuna, R; Gutierrez-Galvez, A; Powar, N Transient Response Analysis for Temperature Modulated Chemoresistors Conference Proceedings of the 9th International Meeting on Chemical Sensors, 2002. @conference{gutierrez2002transient,
title = {Transient Response Analysis for Temperature Modulated Chemoresistors},
author = {R Gutierrez-Osuna and A Gutierrez-Galvez and N Powar},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2002transient.pdf},
year = {2002},
date = {2002-01-01},
booktitle = {Proceedings of the 9th International Meeting on Chemical Sensors},
keywords = {Chemical sensors, Metal-oxide sensors, Temperature modulation},
pubstate = {published},
tppubtype = {conference}
}
|
2001
|
Perera-Lluna, A; Pardo, T; Sundic, T; Marco, S; Gutierrez-Osuna, R IpNose: Electronic nose for distributed air quality monitoring system Conference Proceedings of the 3rd European Congress on Odours, Metrology and Electronic Noses, 2001. @conference{perera2001airquality,
title = {IpNose: Electronic nose for distributed air quality monitoring system},
author = {A Perera-Lluna and T Pardo and T Sundic and S Marco and R Gutierrez-Osuna},
year = {2001},
date = {2001-06-19},
booktitle = {Proceedings of the 3rd European Congress on Odours, Metrology and Electronic Noses},
abstract = {Electronic noses are intelligent instruments that are able to classify and quantify different gas/odours. Here we suggest the integration of a small form factor computer inside the electronic nose. This concept allows us to easily provide remote connectivity, large data storage and complex signal processing. The evolution of this technology will permit distributed sensing with applications to agriculture and environment. Proposed instrument allows incoming connections for remote control of bad odours in landfill sites. Preliminary approach to this application using commercial sensors and mixture model pattern recognition scheme is exposed.},
keywords = {Electronic nose},
pubstate = {published},
tppubtype = {conference}
}
Electronic noses are intelligent instruments that are able to classify and quantify different gas/odours. Here we suggest the integration of a small form factor computer inside the electronic nose. This concept allows us to easily provide remote connectivity, large data storage and complex signal processing. The evolution of this technology will permit distributed sensing with applications to agriculture and environment. Proposed instrument allows incoming connections for remote control of bad odours in landfill sites. Preliminary approach to this application using commercial sensors and mixture model pattern recognition scheme is exposed. |
Perera-Lluna, A; Gutierrez-Osuna, R; Marco, S ipNOSE: A portable volatile analyzer based on embedded technology for intensive computation and time dependent signal processing Conference Proceedings of the 8th International Symposium on Olfaction and the Electronic Nose, 2001. @conference{perera2001volatile,
title = {ipNOSE: A portable volatile analyzer based on embedded technology for intensive computation and time dependent signal processing},
author = {A Perera-Lluna and R Gutierrez-Osuna and S Marco},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/perera2001volatile.pdf},
year = {2001},
date = {2001-03-25},
booktitle = {Proceedings of the 8th International Symposium on Olfaction and the Electronic Nose},
abstract = {Most electronic noses need a computer and special software in order to analyze data from sensors. In the case of portable electronic noses, most of them are operated by microcontrollers with limited data storage (usually feature vectors) and simple signal processing capabilities. Here we suggest the integration of a small form factor computer inside the electronic nose. This concept allows us to easily perform temperature modulation over metal oxide sensors, remote connectivity under TCP/IP networking, large data storage and complex signal processing.},
keywords = {Electronic nose, Metal-oxide sensors},
pubstate = {published},
tppubtype = {conference}
}
Most electronic noses need a computer and special software in order to analyze data from sensors. In the case of portable electronic noses, most of them are operated by microcontrollers with limited data storage (usually feature vectors) and simple signal processing capabilities. Here we suggest the integration of a small form factor computer inside the electronic nose. This concept allows us to easily perform temperature modulation over metal oxide sensors, remote connectivity under TCP/IP networking, large data storage and complex signal processing. |
Kakumanu, P; Gutierrez-Osuna, R; Esposito, A; Bryll, R; Goshtasby, A; Garcia, ON Speech driven facial animation Conference Proceedings of the 2001 workshop on Perceptive user interfaces, ACM 2001. @conference{kakumanu2001speech,
title = {Speech driven facial animation},
author = {P Kakumanu and R Gutierrez-Osuna and A Esposito and R Bryll and A Goshtasby and ON Garcia},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/kakumanu2001speech.pdf},
year = {2001},
date = {2001-01-01},
booktitle = {Proceedings of the 2001 workshop on Perceptive user interfaces},
pages = {1--5},
organization = {ACM},
abstract = {The results reported in this article are an integral part of a larger project aimed at achieving perceptually realistic animations, including the individualized nuances, of three-dimensional human faces driven by speech. The audiovisual system that has been developed for learning the spatio-temporal relationship between speech acoustics and facial animation is described, including video and speech processing, pattern analysis, and MPEG-4 compliant facial animation for a given speaker. In particular, we propose a perceptual transformation of the speech spectral envelope, which is shown to capture the dynamics of articulatory movements. An efficient nearest-neighbor algorithm is used to predict novel articulatory trajectories from the speech dynamics. The results are very promising and suggest a new way to approach the modeling of synthetic lip motion of a given speaker driven by his/her speech. This would also provide clues toward a more general cross-speaker realistic animation.},
keywords = {Facial animation, Speech},
pubstate = {published},
tppubtype = {conference}
}
The results reported in this article are an integral part of a larger project aimed at achieving perceptually realistic animations, including the individualized nuances, of three-dimensional human faces driven by speech. The audiovisual system that has been developed for learning the spatio-temporal relationship between speech acoustics and facial animation is described, including video and speech processing, pattern analysis, and MPEG-4 compliant facial animation for a given speaker. In particular, we propose a perceptual transformation of the speech spectral envelope, which is shown to capture the dynamics of articulatory movements. An efficient nearest-neighbor algorithm is used to predict novel articulatory trajectories from the speech dynamics. The results are very promising and suggest a new way to approach the modeling of synthetic lip motion of a given speaker driven by his/her speech. This would also provide clues toward a more general cross-speaker realistic animation. |
Gutierrez-Osuna, R; Powar, N; Sun, P Chemosensory adaptation in an electronic nose Conference Proceedings of the 2nd IEEE International Symposium on Bioinformatics and Bioengineering Conference, IEEE 2001. @conference{gutierrez2001chemosensory,
title = {Chemosensory adaptation in an electronic nose},
author = {R Gutierrez-Osuna and N Powar and P Sun},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2001chemosensory.pdf},
year = {2001},
date = {2001-01-01},
booktitle = {Proceedings of the 2nd IEEE International Symposium on Bioinformatics and Bioengineering Conference},
pages = {223--229},
organization = {IEEE},
abstract = {This article presents a computational mechanism inspired by the process of chemosensory adaptation in the mammalian olfactory system. The algorithm operates on multiple subsets of the sensory space, generating a family of discriminant functions for different volatile compounds. A set of selectivity coefficients is associated to each discriminant function on the basis of its behavior in the presence of mixtures. These coefficients are employed to form a weighted average of the discriminant functions and establish a feedback signal that reduces the contribution of certain sensory inputs, inhibiting the overall selectivity of the system to previously detected analytes. The algorithm is validated on a database of organic solvents using an array of temperature-modulated metal-oxide chemoresistors.},
keywords = {Chemical sensors, Electronic nose, Metal-oxide sensors, Neuromorphic models, Temperature modulation},
pubstate = {published},
tppubtype = {conference}
}
This article presents a computational mechanism inspired by the process of chemosensory adaptation in the mammalian olfactory system. The algorithm operates on multiple subsets of the sensory space, generating a family of discriminant functions for different volatile compounds. A set of selectivity coefficients is associated to each discriminant function on the basis of its behavior in the presence of mixtures. These coefficients are employed to form a weighted average of the discriminant functions and establish a feedback signal that reduces the contribution of certain sensory inputs, inhibiting the overall selectivity of the system to previously detected analytes. The algorithm is validated on a database of organic solvents using an array of temperature-modulated metal-oxide chemoresistors. |
Gutierrez-Osuna, R; Schiffman, S S; Nagle, H T Correlation of sensory analysis with electronic nose data for swine odor remediation assessment Conference Proceedings of the 3rd European Congress on Odours, Metrology and Electronic Noses, 2001. @conference{gutierrez2001correlation,
title = {Correlation of sensory analysis with electronic nose data for swine odor remediation assessment},
author = {R Gutierrez-Osuna and S S Schiffman and H T Nagle},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2001correlation.pdf},
year = {2001},
date = {2001-01-01},
booktitle = {Proceedings of the 3rd European Congress on Odours, Metrology and Electronic Noses},
abstract = {This article presents an evaluation of the electronic nose technology as an alternative to sensory analysis for assessing the effectiveness of biofilters. An AromaScan® A32S electronic nose and a human panel at Duke University’s Taste and Smell Research Lab were used to measure typical volatile compounds from swine confinement buildings. Chemometrics techniques were employed to predict the olfactory scores of the human panel from the electronic nose data. The cross-sensitivity of the sensor array to the humidity of the samples is discussed. Our results indicate that the electronic nose generates responses that are correlated with sensory analysis ratings of swine malodors at different concentrations.},
keywords = {Electronic nose, Olfaction},
pubstate = {published},
tppubtype = {conference}
}
This article presents an evaluation of the electronic nose technology as an alternative to sensory analysis for assessing the effectiveness of biofilters. An AromaScan® A32S electronic nose and a human panel at Duke University’s Taste and Smell Research Lab were used to measure typical volatile compounds from swine confinement buildings. Chemometrics techniques were employed to predict the olfactory scores of the human panel from the electronic nose data. The cross-sensitivity of the sensor array to the humidity of the samples is discussed. Our results indicate that the electronic nose generates responses that are correlated with sensory analysis ratings of swine malodors at different concentrations. |
Perera-Lluna, A; Pardo, T; Sundi, T; Gutierrez-Osuna, R; Marco, S; Nicolas, J IpNose: Electronic nose for remote bad odour monitoring system in landfill sites Conference Proceedings of the 8th conference EURODEUR, 2001. @conference{perera2001ipnose,
title = {IpNose: Electronic nose for remote bad odour monitoring system in landfill sites},
author = {A Perera-Lluna and T Pardo and T Sundi and R Gutierrez-Osuna and S Marco and J Nicolas},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/perera2001ipnose.pdf},
year = {2001},
date = {2001-01-01},
booktitle = {Proceedings of the 8th conference EURODEUR},
pages = {19--21},
abstract = {Electronic noses are intelligent instruments that are able to classify and quantify different gas/odours. Here we suggest the integration of a small form factor computer inside the electronic nose. This concept allows us to easily provide remote connectivity, large data storage and complex signal processing. The evolution of this technology will permit distributed sensing with applications to agriculture and environment. Proposed instrument allows incoming connections for remote control of bad odours in landfill sites. Preliminary approach to this application using commercial sensors and mixture model pattern recognition scheme is exposed.},
keywords = {Electronic nose},
pubstate = {published},
tppubtype = {conference}
}
Electronic noses are intelligent instruments that are able to classify and quantify different gas/odours. Here we suggest the integration of a small form factor computer inside the electronic nose. This concept allows us to easily provide remote connectivity, large data storage and complex signal processing. The evolution of this technology will permit distributed sensing with applications to agriculture and environment. Proposed instrument allows incoming connections for remote control of bad odours in landfill sites. Preliminary approach to this application using commercial sensors and mixture model pattern recognition scheme is exposed. |
Schiffman, S S; Gutierrez-Osuna, R; Nagle, H T Use of an electronic nose to evaluate odors from swine operations Conference Proceedings of the 8th International Symposium on Olfaction and Electronic Nose, 2001. @conference{schiffman2001use,
title = {Use of an electronic nose to evaluate odors from swine operations},
author = {S S Schiffman and R Gutierrez-Osuna and H T Nagle},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/schiffman2001use.pdf},
year = {2001},
date = {2001-01-01},
booktitle = {Proceedings of the 8th International Symposium on Olfaction and Electronic Nose},
abstract = {In this project, an AromaScan A32S electronic nose and a human panel at the Duke Taste and Smell Lab were used to evaluate the effectiveness of biofilters in reducing the malodors in the exhaust air from swine confinement facilities. Three experiments are reported: 1) detection threshold tests for the electronic nose and human panel for a significant component of swine slurry – acetic acid, 2) hedonic tone evaluation by the human panel and electronic nose in a benchtop biofilter setup for an synthetic swine slurry, and 3) field test of the electronic nose in an operational biofilter at a swine production facility. The feasibility of using an electronic nose to replace the human panel in these applications is demonstrated.},
keywords = {Electronic nose},
pubstate = {published},
tppubtype = {conference}
}
In this project, an AromaScan A32S electronic nose and a human panel at the Duke Taste and Smell Lab were used to evaluate the effectiveness of biofilters in reducing the malodors in the exhaust air from swine confinement facilities. Three experiments are reported: 1) detection threshold tests for the electronic nose and human panel for a significant component of swine slurry – acetic acid, 2) hedonic tone evaluation by the human panel and electronic nose in a benchtop biofilter setup for an synthetic swine slurry, and 3) field test of the electronic nose in an operational biofilter at a swine production facility. The feasibility of using an electronic nose to replace the human panel in these applications is demonstrated. |
Gutierrez-Osuna, R; Korah, S; Perera, A Multi-frequency temperature modulation for metal-oxide gas sensors Conference Proceedings of the 8th International Symposium on Olfaction and the Electronic Nose, 2001. @conference{gutierrez2001multi,
title = {Multi-frequency temperature modulation for metal-oxide gas sensors},
author = {R Gutierrez-Osuna and S Korah and A Perera},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2001multi.pdf},
year = {2001},
date = {2001-01-01},
booktitle = {Proceedings of the 8th International Symposium on Olfaction and the Electronic Nose},
pages = {212--218},
abstract = {This article presents a multi-frequency approach to temperature modulation for commercial metal-oxide gas sensors. The heating element is excited with a sinusoidal waveform at different frequencies ranging from 0.125 to 4 Hz, as well as DC. Experimental results on five compounds yield 100% classification rate on temperature-modulated responses, in comparison with 50-60% for DC-heated responses.},
keywords = {Chemical sensors, Metal-oxide sensors, Temperature modulation},
pubstate = {published},
tppubtype = {conference}
}
This article presents a multi-frequency approach to temperature modulation for commercial metal-oxide gas sensors. The heating element is excited with a sinusoidal waveform at different frequencies ranging from 0.125 to 4 Hz, as well as DC. Experimental results on five compounds yield 100% classification rate on temperature-modulated responses, in comparison with 50-60% for DC-heated responses. |
Garcia, O N; Gutierrez-Osuna, R An Updated Approach to Complexity from an Agent-Centered Artificial Intelligence Perspective Book Chapter In: Encyclopedia of Library and Information Science (ELIS), vol. 68, pp. 346-366, 2001. @inbook{garcia2001complexity,
title = {An Updated Approach to Complexity from an Agent-Centered Artificial Intelligence Perspective},
author = {O N Garcia and R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/garcia2001complexity.pdf},
year = {2001},
date = {2001-01-01},
booktitle = {Encyclopedia of Library and Information Science (ELIS)},
volume = {68},
pages = {346-366},
abstract = {Here we update and expand our previous work to find commonality in a variety of systems, situations, and organisms with regard to a generic concept of complexity (1). Such attempts have drawn significant attention from outstanding researchers of diverse backgrounds (2). Despite years of research with many papers written, there is yet to appear a convergence toward a unified methodology in the multi-disciplinary approaches. In particular, we consider how the synthesis of complex systems, as is practiced in the software engineering of large systems, sheds light on the analysis of complexity. We consider how levels of abstraction at different granularities relate to complexity from the point of view of the description of a model of the system. We consider also the relationship of an intelligent agent, symbolic or biological, with the estimation of complexity. We use the term agent to include both intelligent programs and humans, which learn systems (models) from observations and adapt to their environment by learning. It is suggested here that an agent-centered approach, factoring complexity modulo a context (called in Artificial Intelligence a perspective), may provide a more general approach to determining the complexity of an object or system. The thesis presented here is that the object must not be considered independently from its user agent and its context and that in the duality of the consideration, one may learn more about both the general characteristics of complexity and of the specific reasons for our interest in it. The proposal is to consider user, interaction, and the related interfaces simultaneously when studying the complexity of a system. This approach is more integrative and less reductionist than studying any of the system aspects individually and bridges the difficulties of a large range of diverse settings. An overview of the field is briefly presented in light of the proposed approach.},
keywords = {Other},
pubstate = {published},
tppubtype = {inbook}
}
Here we update and expand our previous work to find commonality in a variety of systems, situations, and organisms with regard to a generic concept of complexity (1). Such attempts have drawn significant attention from outstanding researchers of diverse backgrounds (2). Despite years of research with many papers written, there is yet to appear a convergence toward a unified methodology in the multi-disciplinary approaches. In particular, we consider how the synthesis of complex systems, as is practiced in the software engineering of large systems, sheds light on the analysis of complexity. We consider how levels of abstraction at different granularities relate to complexity from the point of view of the description of a model of the system. We consider also the relationship of an intelligent agent, symbolic or biological, with the estimation of complexity. We use the term agent to include both intelligent programs and humans, which learn systems (models) from observations and adapt to their environment by learning. It is suggested here that an agent-centered approach, factoring complexity modulo a context (called in Artificial Intelligence a perspective), may provide a more general approach to determining the complexity of an object or system. The thesis presented here is that the object must not be considered independently from its user agent and its context and that in the duality of the consideration, one may learn more about both the general characteristics of complexity and of the specific reasons for our interest in it. The proposal is to consider user, interaction, and the related interfaces simultaneously when studying the complexity of a system. This approach is more integrative and less reductionist than studying any of the system aspects individually and bridges the difficulties of a large range of diverse settings. An overview of the field is briefly presented in light of the proposed approach. |
2000
|
Gutierrez-Osuna, R; Garcia, O N An application of Rissanen’s Complexity Measure to Optimizing Abstraction Level Conference Proceedings of the 5th Annual Conference on Human Interaction with Complex Systems, 2000. @conference{gutierrezapplication,
title = {An application of Rissanen’s Complexity Measure to Optimizing Abstraction Level},
author = {R Gutierrez-Osuna and O N Garcia},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2000application.pdf},
year = {2000},
date = {2000-05-02},
booktitle = {Proceedings of the 5th Annual Conference on Human Interaction with Complex Systems},
abstract = {In previous work we have considered the usercentered complexity of a hierarchy of abstractions as observed from a user’s perspective. We hypothesized that, given a perspective, there should be a variety of complexities depending on the granularity of the abstraction and the measure of complexity chosen. In this paper we consider an optimization based on the Minimum Description Length complexity measure and its implications for choosing the proper level of abstraction.},
keywords = {Other},
pubstate = {published},
tppubtype = {conference}
}
In previous work we have considered the usercentered complexity of a hierarchy of abstractions as observed from a user’s perspective. We hypothesized that, given a perspective, there should be a variety of complexities depending on the granularity of the abstraction and the measure of complexity chosen. In this paper we consider an optimization based on the Minimum Description Length complexity measure and its implications for choosing the proper level of abstraction. |
Gutierrez-Osuna, R Drift reduction for metal-oxide sensor arrays using canonical correlation regression and partial least squares Conference Proceedings of the 7th International Symposium On Olfaction & Electronic Nose, 2000. @conference{gutierrez2000drift,
title = {Drift reduction for metal-oxide sensor arrays using canonical correlation regression and partial least squares},
author = {R Gutierrez-Osuna},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez2000drift.pdf},
year = {2000},
date = {2000-01-01},
booktitle = {Proceedings of the 7th International Symposium On Olfaction & Electronic Nose},
journal = {Electronic Noses and Olfaction 2000},
abstract = {The transient response of metal-oxide sensors exposed to mild odours can be oftentimes highly correlated with the behaviour of the array during the preceding wash and reference cycles. Since wash/reference gases are virtually constant overtime, variations in their transient response can be used to estimate the amount of sensor drift present in each experiment. We perform canonical correlation analysis and partial least squares to find a subset of “latent variables” that summarize the linear dependencies between odour and wash/reference responses. Ordinary least squares regression is then used to subtract these “latent variables” from the odour response. Experimental results on an odour database of four cooking spices, collected on a 10-sensor array over a period of three months, show significant improvements in predictive accuracy.},
keywords = {Metal-oxide sensors},
pubstate = {published},
tppubtype = {conference}
}
The transient response of metal-oxide sensors exposed to mild odours can be oftentimes highly correlated with the behaviour of the array during the preceding wash and reference cycles. Since wash/reference gases are virtually constant overtime, variations in their transient response can be used to estimate the amount of sensor drift present in each experiment. We perform canonical correlation analysis and partial least squares to find a subset of “latent variables” that summarize the linear dependencies between odour and wash/reference responses. Ordinary least squares regression is then used to subtract these “latent variables” from the odour response. Experimental results on an odour database of four cooking spices, collected on a 10-sensor array over a period of three months, show significant improvements in predictive accuracy. |
Schiffman, S S; Wyrick, D; Gutierrez-Osuna, R; Nagle, H T Effectiveness of an electronic nose for monitoring bacterial and fungal growth Conference Proceedings of the 7th International Symposium On Olfaction & Electronic Nose, 2000. @conference{schiffman2000effectiveness,
title = {Effectiveness of an electronic nose for monitoring bacterial and fungal growth},
author = {S S Schiffman and D Wyrick and R Gutierrez-Osuna and H T Nagle},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/schiffman2001effectiveness.pdf},
year = {2000},
date = {2000-01-01},
booktitle = {Proceedings of the 7th International Symposium On Olfaction & Electronic Nose},
journal = {Electronic noses and olfaction},
pages = {173--180},
abstract = {Growth of microbial organisms such as bacteria and fungi generates volatile organic compounds and fixed gases. An electronic nose consisting of 15 metal-oxide sensors (NC State E-Nose) was used to detect and classify bacteria and fungi. Three preliminary experiments were conducted with the electronic nose using odorous stimuli related to microbial contamination. The results suggested that the NC State E-Nose could classify bacteria, fungi, and associated volatile organic compounds. A further experiment was performed to detect and classify five fungi commonly found in indoor environments. These fungi were Aspergillus flavus, Aspergillus niger, Penicillium chrysogenum, Cladosporium cladosporioides, and Stachybotrys chartarum. The fungi were cultured on two types of media, Potato Dextrose Agar (PDA) and Czapek-Dox Agar. The NC State E-nose was capable of discriminating among these fungi with up to 96% accuracy.},
keywords = {Electronic nose},
pubstate = {published},
tppubtype = {conference}
}
Growth of microbial organisms such as bacteria and fungi generates volatile organic compounds and fixed gases. An electronic nose consisting of 15 metal-oxide sensors (NC State E-Nose) was used to detect and classify bacteria and fungi. Three preliminary experiments were conducted with the electronic nose using odorous stimuli related to microbial contamination. The results suggested that the NC State E-Nose could classify bacteria, fungi, and associated volatile organic compounds. A further experiment was performed to detect and classify five fungi commonly found in indoor environments. These fungi were Aspergillus flavus, Aspergillus niger, Penicillium chrysogenum, Cladosporium cladosporioides, and Stachybotrys chartarum. The fungi were cultured on two types of media, Potato Dextrose Agar (PDA) and Czapek-Dox Agar. The NC State E-nose was capable of discriminating among these fungi with up to 96% accuracy. |
1999
|
Gutierrez-Osuna, R; Nagle, H T; Schiffman, S S Transient response analysis of an electronic nose using multi-exponential models Journal Article In: Sensors and Actuators B: Chemical, vol. 61, no. 1-3, pp. 170–182, 1999. @article{gutierrez1999transient,
title = {Transient response analysis of an electronic nose using multi-exponential models},
author = {R Gutierrez-Osuna and H T Nagle and S S Schiffman},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez1999transient.pdf},
year = {1999},
date = {1999-01-01},
journal = {Sensors and Actuators B: Chemical},
volume = {61},
number = {1-3},
pages = {170--182},
publisher = {Elsevier},
abstract = {The purpose of this study is to model the transient response of conductivity-based gas sensors in the context of odor recognition with an electronic nose. Commonly, only the steady-state response of the sensor is used for pattern recognition, ignoring the transient response, which conveys useful discriminatory information. The transient response is modeled as a sum of real exponential functions that represent the different decay processes that occur during sampling of the gas into the sensor chamber and adsorption of the odor compounds onto the sensing element. Four multi-exponential models are reviewed: Gardner transform, multi-exponential transient spectroscopy, Pade-Laplace and Pade-Z transforms. Validation on experimental data from an array of conducting-polymer gas sensors shows that the Pade-Laplace and Pade-Z models have better resolution capabilities than the two spectral transforms.},
keywords = {Chemical sensors, Electronic nose, Temperature modulation},
pubstate = {published},
tppubtype = {article}
}
The purpose of this study is to model the transient response of conductivity-based gas sensors in the context of odor recognition with an electronic nose. Commonly, only the steady-state response of the sensor is used for pattern recognition, ignoring the transient response, which conveys useful discriminatory information. The transient response is modeled as a sum of real exponential functions that represent the different decay processes that occur during sampling of the gas into the sensor chamber and adsorption of the odor compounds onto the sensing element. Four multi-exponential models are reviewed: Gardner transform, multi-exponential transient spectroscopy, Pade-Laplace and Pade-Z transforms. Validation on experimental data from an array of conducting-polymer gas sensors shows that the Pade-Laplace and Pade-Z models have better resolution capabilities than the two spectral transforms. |
Gutierrez-Osuna, R; Nagle, H T A method for evaluating data-preprocessing techniques for odour classification with an array of gas sensors Journal Article In: Systems, Man, and Cybernetics, Part B: Cybernetics, IEEE Transactions on, vol. 29, no. 5, pp. 626–632, 1999. @article{gutierrez1999method,
title = {A method for evaluating data-preprocessing techniques for odour classification with an array of gas sensors},
author = {R Gutierrez-Osuna and H T Nagle},
url = {https://psi.engr.tamu.edu/wp-content/uploads/2018/01/gutierrez1999method.pdf},
year = {1999},
date = {1999-01-01},
journal = {Systems, Man, and Cybernetics, Part B: Cybernetics, IEEE Transactions on},
volume = {29},
number = {5},
pages = {626--632},
publisher = {IEEE},
abstract = {The performance of a pattern recognition system is dependent on, among other things, an appropriate data-preprocessing technique, In this paper, we describe a method to evaluate the performance of a variety of these techniques for the problem of odour classification using an array of gas sensors, also referred to as an electronic nose. Four experimental odour databases with different complexities are used to score the data-preprocessing techniques. The performance measure used is the cross-validation estimate of the classification rate of a K nearest neighbor voting rule operating on Fisher's linear discriminant projection subspace.},
keywords = {Chemical sensors},
pubstate = {published},
tppubtype = {article}
}
|