2021
Sunyong Yoo; Dong-Wook Kim; Young-Eun Kim; Jong Heon Park; Yeon-Yong Kim; Kyu-dong Cho; Mi-Ji Gwon; Jae-In Shin; Eun-Joo Lee
Abstract | Links | BibTeX | Dimensions | Tags: Allergic rhinitis, Asthma, Atopic dermatitis, Database, National health insurance service
@article{yoo2021data,
title = {Data resource profile: the allergic disease database of the Korean National Health Insurance Service},
author = {Sunyong Yoo and Dong-Wook Kim and Young-Eun Kim and Jong Heon Park and Yeon-Yong Kim and Kyu-dong Cho and Mi-Ji Gwon and Jae-In Shin and Eun-Joo Lee},
url = {https://www.ncbi.nlm.nih.gov/pmc/articles/PMC8060521/},
doi = {10.4178/epih.e2021010},
year = {2021},
date = {2021-01-21},
urldate = {2021-01-21},
journal = {Epidemiology and Health},
volume = {43},
pages = {e2021010},
publisher = {Korean Society of Epidemiology},
abstract = {Researchers have been interested in probing how the environmental factors associated with allergic diseases affect the use of medical services. Considering this demand, we have constructed a database, named the Allergic Disease Database, based on the National Health Insurance Database (NHID). The NHID contains information on demographic and medical service utilization for approximately 99% of the Korean population. This study targeted 3 major allergic diseases, including allergic rhinitis, atopic dermatitis, and asthma. For the target diseases, our database provides daily medical service information, including the number of daily visits from 2013 and 2017, categorized by patients’ characteristics such as address, sex, age, and duration of residence. We provide additional information, including yearly population, a number of patients, and averaged geocoding coordinates by eup, myeon, and dong district code (the smallest-scale administrative units in Korea). This information enables researchers to analyze how daily changes in the environmental factors of allergic diseases (e.g., particulate matter, sulfur dioxide, and ozone) in certain regions would influence patients’ behavioral patterns of medical service utilization. Moreover, researchers can analyze long-term trends in allergic diseases and the health effects caused by environmental factors such as daily climate and pollution data. The advantages of this database are easy access to data, additional levels of geographic detail, time-efficient data-refining and processing, and a de-identification process that minimizes the exposure of identifiable personal information. All datasets included in the Allergic Disease Database can be downloaded by accessing the National Health Insurance Service data sharing webpage (https://nhiss.nhis.or.kr).},
keywords = {Allergic rhinitis, Asthma, Atopic dermatitis, Database, National health insurance service},
pubstate = {published},
tppubtype = {article}
}
2018
Sunyong Yoo; Suhyun Ha; Moonshik Shin; Kyungrin Noh; Hojung Nam; Doheon Lee
Abstract | Links | BibTeX | Dimensions | Tags: Database, Drugs, Ethnopharmacology, Machine learning
@article{yoo2018data,
title = {A data-driven approach for identifying medicinal combinations of natural products},
author = {Sunyong Yoo and Suhyun Ha and Moonshik Shin and Kyungrin Noh and Hojung Nam and Doheon Lee},
url = {https://ieeexplore.ieee.org/abstract/document/8482294},
doi = {10.1109/ACCESS.2018.2874089},
year = {2018},
date = {2018-10-05},
urldate = {2018-10-05},
journal = {IEEE Access},
volume = {6},
pages = {58106–58118},
publisher = {IEEE},
abstract = {Combinations of natural products have been used as important sources of disease treatments. Existing databases contain information about prescriptions, herbs, and compounds and their relationships with phenotypes, but they do not have information on the use of combinations of natural product compounds. In this paper, we identified large-scale associations between natural product combinations and phenotypes by applying an association rule mining technique to integrated information on herbal medicine, combination drugs, functional foods, molecular compounds, and target genes. The rationale behind this approach is that natural products commonly found in medicinal multicomponent mixtures have statistically significant associations with the therapeutic effects of the multicomponent mixtures. Based on a molecular network analysis and an external literature validation, we show that the inferred associations are valuable information for identifying medicinal combinations of natural products since they have statistically significant closeness proximity in the molecular layer and have much experimental evidence. All results are available through the workbench site at http://biosoft.kaist.ac.kr/coconut to facilitate the investigation of the medicinal use of natural products and their combinations.},
keywords = {Database, Drugs, Ethnopharmacology, Machine learning},
pubstate = {published},
tppubtype = {article}
}
2016
Jongsoo Keum; Sunyong Yoo; Doheon Lee; Hojung Nam
Abstract | Links | BibTeX | Dimensions | Tags: Bioinformatics, Database, Herbal medicine, Target proteins
@article{keum2016prediction,
title = {Prediction of compound-target interactions of natural products using large-scale drug and protein information},
author = {Jongsoo Keum and Sunyong Yoo and Doheon Lee and Hojung Nam},
url = {https://link.springer.com/article/10.1186/s12859-016-1081-y},
doi = {10.1186/s12859-016-1081-y},
year = {2016},
date = {2016-07-28},
urldate = {2016-07-28},
journal = {BMC bioinformatics},
volume = {17},
number = {219},
pages = {417–425},
publisher = {Springer},
abstract = {Background
Verifying the proteins that are targeted by compounds of natural herbs will be helpful to select natural herb-based drug candidates. However, this entails a great deal of effort to clarify the interaction throughout in vitro or in vivo experiments. In this light, in silico prediction of the interactions between compounds and target proteins can help ease the efforts.
Results
In this study, we performed in silico predictions of herbal compound target identification. First, data related to compounds, target proteins, and interactions between them are taken from the DrugBank database. Then we characterized six classes of compound-target interaction in humans including G-protein-coupled receptors (GPCRs), ion channel, enzymes, receptors, transporters, and other proteins. Also, classification-prediction models that predict the interactions between compounds and target proteins through a machine learning method were constructed using these matrices. As a result, AUC values of six classes are 0.94, 0.93, 0.90, 0.89, 0.91, and 0.76 respectively. Finally, the interactions of compounds from natural products were predicted using the constructed classification models. Furthermore, from our predicted results, we confirmed that several important disease related proteins were predicted as targets of natural herbal compounds.
Conclusions
We constructed classification-prediction models that predict the interactions between compounds and target proteins. The constructed models showed good prediction performances, and numbers of potential natural compounds target proteins were predicted from our results.},
keywords = {Bioinformatics, Database, Herbal medicine, Target proteins},
pubstate = {published},
tppubtype = {article}
}
Verifying the proteins that are targeted by compounds of natural herbs will be helpful to select natural herb-based drug candidates. However, this entails a great deal of effort to clarify the interaction throughout in vitro or in vivo experiments. In this light, in silico prediction of the interactions between compounds and target proteins can help ease the efforts.
Results
In this study, we performed in silico predictions of herbal compound target identification. First, data related to compounds, target proteins, and interactions between them are taken from the DrugBank database. Then we characterized six classes of compound-target interaction in humans including G-protein-coupled receptors (GPCRs), ion channel, enzymes, receptors, transporters, and other proteins. Also, classification-prediction models that predict the interactions between compounds and target proteins through a machine learning method were constructed using these matrices. As a result, AUC values of six classes are 0.94, 0.93, 0.90, 0.89, 0.91, and 0.76 respectively. Finally, the interactions of compounds from natural products were predicted using the constructed classification models. Furthermore, from our predicted results, we confirmed that several important disease related proteins were predicted as targets of natural herbal compounds.
Conclusions
We constructed classification-prediction models that predict the interactions between compounds and target proteins. The constructed models showed good prediction performances, and numbers of potential natural compounds target proteins were predicted from our results.