💿🐜 Antkeeper source code https://antkeeper.com
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

78 lines
3.0 KiB

/*
* Copyright (C) 2021 Christopher J. Howard
*
* This file is part of Antkeeper source code.
*
* Antkeeper source code is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Antkeeper source code is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Antkeeper source code. If not, see <http://www.gnu.org/licenses/>.
*/
#ifndef ANTKEEPER_GENETICS_CODON_HPP
#define ANTKEEPER_GENETICS_CODON_HPP
namespace genetics {
/// Functions and structures related to triplets of IUPAC base symbols.
namespace codon {
/**
* Table for translating codons to amino acids.
*
* @see https://www.ncbi.nlm.nih.gov/Taxonomy/Utils/wprintgc.cgi
*/
struct table
{
/// String of 64 IUPAC amino acid base symbols, in TCAG order.
const char* aas;
/// String of 64 IUPAC amino acid base symbols, in TCAG order, where symbols other than `-` and `*` indicate a start codon and its amino acid.
const char* starts;
};
/**
* Returns `true` if a codon is a start codon.
*
* @param base1 IUPAC base code of first nucleobase, either `U`, `T`, `C`, `A`, or `G`.
* @param base2 IUPAC base code of second nucleobase, either `U`, `T`, `C`, `A`, or `G`.
* @param base3 IUPAC base code of third nucleobase, either `U`, `T`, `C`, `A`, or `G`.
* @param starts String of 64 IUPAC amino acid codes, in TCAG order.
* @return `true` if the codon is a start codon, `false` otherwise.
*/
bool is_start(char base1, char base2, char base3, const char* starts);
/**
* Returns `true` if a codon is a stop codon.
*
* @param base1 IUPAC base code of first nucleobase, either `U`, `T`, `C`, `A`, or `G`.
* @param base2 IUPAC base code of second nucleobase, either `U`, `T`, `C`, `A`, or `G`.
* @param base3 IUPAC base code of third nucleobase, either `U`, `T`, `C`, `A`, or `G`.
* @param aas String of 64 IUPAC amino acid codes, in TCAG order.
* @return `true` if the codon is a stop codon, `false` otherwise.
*/
bool is_stop(char base1, char base2, char base3, const char* aas);
/**
* Translates a codon into an amino acid.
*
* @param base1 IUPAC base code of first nucleobase, either `U`, `T`, `C`, `A`, or `G`.
* @param base2 IUPAC base code of second nucleobase, either `U`, `T`, `C`, `A`, or `G`.
* @param base3 IUPAC base code of third nucleobase, either `U`, `T`, `C`, `A`, or `G`.
* @param aas String of 64 IUPAC amino acid codes, in TCAG order.
* @return IUPAC amino acid code of corresponding amino acid, or `-` if an invalid codon was supplied.
*/
char translate(char base1, char base2, char base3, const char* aas);
} // namspace codon
} // namespace genetics
#endif // ANTKEEPER_GENETICS_CODON_HPP