@article{437e59edf29d42a49abf395234b42070,
title = "Fast and exact gap-affine partial order alignment with POASTA",
abstract = "MotivationPartial order alignment is a widely used method for computing multiple sequence alignments, with applications in genome assembly and pangenomics, among many others. Current algorithms to compute the optimal, gap-affine partial order alignment do not scale well to larger graphs and sequences. While heuristic approaches exist, they do not guarantee optimal alignment and sacrifice alignment accuracy.ResultsWe present POASTA, a new optimal algorithm for partial order alignment that exploits long stretches of matching sequence between the graph and a query. We benchmarked POASTA against the state-of-the-art on several diverse bacterial gene datasets and demonstrated an average speed-up of 4.1x and up to 9.8x, using less memory. POASTA{\textquoteright}s memory scaling characteristics enabled the construction of much larger POA graphs than previously possible, as demonstrated by megabase-length alignments of 342 Mycobacterium tuberculosis sequences.",
keywords = "multiple sequence alignment, partial order alignment, pangenome graphs",
author = "{van Dijk}, {Lucas R.} and Manson, {Abigail L.} and Earl, {Ashlee M.} and Garimella, {Kiran V.} and Thomas Abeel",
year = "2025",
doi = "10.1093/bioinformatics/btae757",
language = "English",
volume = "41",
journal = "Bioinformatics",
issn = "1367-4803",
publisher = "Oxford University Press",
number = "1",
}