% Conference paper in the ACM IMCOM 2015 proceedings.
% The proceedings title is stored in `booktitle` only; it is deliberately not
% repeated in a `series` field, because styles that print both would show it twice.
% `day`, `language`, `keywords` and `abstract` are not used by the standard
% BibTeX styles; they are kept as metadata.
@inproceedings{ccbf9b9a65b3442092a0bda2ccdcdac6,
  author    = {Lee, {Kyung Eun} and Park, {Hyun Seok}},
  title     = {Identifying genomic signatures of n-gram nucleotide sequences to classify the chromatin states of broad histone track},
  booktitle = {{ACM} {IMCOM} 2015 - Proceedings},
  publisher = {Association for Computing Machinery, Inc},
  year      = {2015},
  month     = jan,
  day       = {8},
  doi       = {10.1145/2701126.2701131},
  language  = {English},
  keywords  = {Computational epigenetics, GC-contents, Methylation states, Noncoding DNA, Nucleotide frequency patterns},
  abstract  = {A large proportion of human noncoding DNA had been known to have no biological function. However, unprecedented technical advances have started to convert unannotated noncoding DNA into highly annotated functional regions. In this paper, the frequency of n-grams of regional DNA sequences from fifteen chromatin states of Broad Histone Track are thoroughly analyzed, applying biological language modelling to n-grams. It has been shown that a few particular n-grams are found in abundance in one chromatin state but occurring very rarely in other states, thereby serving as chromatin state signatures. We discuss the significance of the patterns found, as well as their potential use in the special statistical models of nucleotide sequences necessary for developing algorithms for the computational analysis of functional units in noncoding DNA regions.},
  note      = {9th International Conference on Ubiquitous Information Management and Communication, ACM IMCOM 2015 ; Conference date: 08-01-2015 Through 10-01-2015},
}