{"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00214037","sets":["1164:5352:10544:10757"]},"path":["10757"],"owner":"44499","recid":"214037","title":["Predicting PRDM9 binding sites by a convolutional neural network and verification using genetic recombination map"],"pubdate":{"attribute_name":"公開日","attribute_value":"2021-11-23"},"_buckets":{"deposit":"231847bc-835d-4ce8-b312-a8f53f812ac8"},"_deposit":{"id":"214037","pid":{"type":"depid","value":"214037","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"Predicting PRDM9 binding sites by a convolutional neural network and verification using genetic recombination map","author_link":["548385","548381","548384","548383","548380","548382"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"Predicting PRDM9 binding sites by a convolutional neural network and verification using genetic recombination map"},{"subitem_title":"Predicting PRDM9 binding sites by a convolutional neural network and verification using genetic recombination map","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2021-11-23","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"Graduate School of Information Science and Technology, Hokkaido University"},{"subitem_text_value":"Graduate School of Information Science and Technology, Hokkaido University/Faculty of Information Science and Technology, Hokkaido University"},{"subitem_text_value":"Graduate School of Information Science and Technology, Hokkaido University/Faculty of Information Science and Technology, Hokkaido University"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Graduate School of Information Science and Technology, Hokkaido University","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Information Science and Technology, Hokkaido University / Faculty of Information Science and Technology, Hokkaido University","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Information Science and Technology, Hokkaido University / Faculty of Information Science and Technology, Hokkaido University","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"eng"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/214037/files/IPSJ-BIO21068001.pdf","label":"IPSJ-BIO21068001.pdf"},"date":[{"dateType":"Available","dateValue":"2023-11-23"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-BIO21068001.pdf","filesize":[{"value":"627.5 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"41"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"f79044aa-457e-40b9-959a-36a9bcbcac97","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2021 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Takahiro, Nakamura"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Toshinori, Endo"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Naoki, Osada"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Takahiro, Nakamura","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Toshinori, Endo","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Naoki, Osada","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AA12055912","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8590","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"PR domain-containing 9 (PRDM9) is a zinc-finger protein that binds to specific DNA motifs and induces the crossing-over between chromosomes, resulting in a high recombination rate around binding sites. In this study, we developed a strategy to evaluate the prediction accuracy of PRDM9 binding site by examining the correlation with local recombination rate to avoid the effect of overfitting to one type of data. We compared the methods using position-specific weight matrix (PWM), which has been commonly used in previous studies, and convolutional network (CNN), which has recently performed well. Approximately 170,000 genomic DNA fragments of humans (301 bp each) containing the Chromatin Immuno-Precipitation with high-throughput sequencing (ChIP-seq) peak of PRDM9 of B-allele in the HEK293T cell line were used for constructing PWM and positive data to train CNN. We found that CNN outperformed PWM in terms of area under the curve, and the prediction scores of CNN correlated more strongly with the local recombination rate than PWM. We also investigated the potential PRDM9 binding sites missed by the ChIP-seq experiments but labeled as positive in CNN and discuss the reason for the difference in performances.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"PR domain-containing 9 (PRDM9) is a zinc-finger protein that binds to specific DNA motifs and induces the crossing-over between chromosomes, resulting in a high recombination rate around binding sites. In this study, we developed a strategy to evaluate the prediction accuracy of PRDM9 binding site by examining the correlation with local recombination rate to avoid the effect of overfitting to one type of data. We compared the methods using position-specific weight matrix (PWM), which has been commonly used in previous studies, and convolutional network (CNN), which has recently performed well. Approximately 170,000 genomic DNA fragments of humans (301 bp each) containing the Chromatin Immuno-Precipitation with high-throughput sequencing (ChIP-seq) peak of PRDM9 of B-allele in the HEK293T cell line were used for constructing PWM and positive data to train CNN. We found that CNN outperformed PWM in terms of area under the curve, and the prediction scores of CNN correlated more strongly with the local recombination rate than PWM. We also investigated the potential PRDM9 binding sites missed by the ChIP-seq experiments but labeled as positive in CNN and discuss the reason for the difference in performances.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"7","bibliographic_titles":[{"bibliographic_title":"研究報告バイオ情報学(BIO)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2021-11-23","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"1","bibliographicVolumeNumber":"2021-BIO-68"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"id":214037,"updated":"2025-01-19T16:55:40.454524+00:00","links":{},"created":"2025-01-19T01:14:52.466660+00:00"}