@comment{
  PhD thesis record. The citation key is kept unchanged so existing
  citations keep resolving. The family name in the title is brace-protected
  so styles that sentence-case titles do not lowercase it. The abstract is
  reproduced verbatim.
}
@phdthesis{c813f1c034124b059643cfcbaf50c34a,
  author   = {{Tay Fernandez}, Cassandria},
  title    = {Using representative gene sets to validate gene models in legume annotations ({Fabaceae})},
  school   = {The University of Western Australia},
  year     = {2023},
  doi      = {10.26182/cvey-9c15},
  language = {English},
  keywords = {legume genomes, gene annotation, Fabaceae, genome assembly},
  abstract = {With more genomes being assembled, it's important to develop accurate annotation tools. Here, we describe a method to support gene model prediction based on evolutionary conservation and use it to identify potentially erroneous annotations across 12 legume species. We first compare the genes for each of the genomes with the whole genome sequence of other assemblies and the NCBI-NR database to identify potentially unique gene models. Then we removed non-conserved gene models and applied a graph-based approach to identify a representative set. This identified 15,345 representative gene models from 12 legume assemblies that can support genome annotations for other legumes.},
}