Compare commits
2 Commits
f1fe568818
...
ae3732eba2
Author | SHA1 | Date | |
---|---|---|---|
ae3732eba2 | |||
d42ed83b22 |
10
.vscode/settings.json
vendored
10
.vscode/settings.json
vendored
@ -1,3 +1,11 @@
|
|||||||
{
|
{
|
||||||
"python.formatting.provider": "black"
|
"python.formatting.provider": "black",
|
||||||
|
"cSpell.words": [
|
||||||
|
"Biopython",
|
||||||
|
"BLOSUM",
|
||||||
|
"bmlsa",
|
||||||
|
"FASTA"
|
||||||
|
],
|
||||||
|
"python.testing.pytestEnabled": true,
|
||||||
|
"python.analysis.inlayHints.pytestParameters": true
|
||||||
}
|
}
|
10
Jenkinsfile
vendored
10
Jenkinsfile
vendored
@ -12,14 +12,20 @@ pipeline {
|
|||||||
sh 'echo "mamba activate bmlsa" >> ~/.bashrc'
|
sh 'echo "mamba activate bmlsa" >> ~/.bashrc'
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
stage("unit tests") {
|
||||||
|
steps {
|
||||||
|
sh "python -m pytest --junitxml=test_results.xml"
|
||||||
|
xunit checksName: '', tools: [JUnit(excludesPattern: '', pattern: 'test_results.xml', stopProcessingIfError: true)]
|
||||||
|
}
|
||||||
|
}
|
||||||
stage("build") {
|
stage("build") {
|
||||||
steps {
|
steps {
|
||||||
sh "python -m build"
|
sh "python -m build"
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
stage("test") {
|
stage("test installation") {
|
||||||
steps {
|
steps {
|
||||||
sh "pip install dist/*.whl"
|
sh "pip install dist/*.whl --force-reinstall"
|
||||||
sh "bmlsa -h"
|
sh "bmlsa -h"
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
12
README.md
12
README.md
@ -1,3 +1,13 @@
|
|||||||
# BMLSA
|
# BMLSA
|
||||||
|
|
||||||
A Basic multi local sequence alignment tool using the Biopython implementation of the Smith-Waterman alignment algorithm
|
A Basic multi local sequence alignment tool using the Biopython implementation of the Smith-Waterman alignment algorithm.
|
||||||
|
|
||||||
|
## Features
|
||||||
|
|
||||||
|
- Aligns a CSV of short sequences locally to a given reference sequence
|
||||||
|
- Outputs in a CSV with old and new positions
|
||||||
|
- Selectable parameters for alignment
|
||||||
|
- Compatible with a broad range of input CSV formats
|
||||||
|
- Automatically aligns against every sequence in the reference FASTA
|
||||||
|
- All produced output is human readable!
|
||||||
|
|
||||||
|
94
bmlsa/cli.py
94
bmlsa/cli.py
@ -1,94 +0,0 @@
|
|||||||
import os
|
|
||||||
import argparse
|
|
||||||
from Bio import SeqIO
|
|
||||||
from bmlsa.aligner import protein_align_many_to_one_ssw
|
|
||||||
|
|
||||||
from bmlsa.persistence import read_annotations_from_csv, save_alignments_to_csv
|
|
||||||
|
|
||||||
|
|
||||||
def main():
|
|
||||||
argparser = argparse.ArgumentParser("blmsa")
|
|
||||||
argparser.add_argument(
|
|
||||||
"annotations",
|
|
||||||
type=str,
|
|
||||||
help=(
|
|
||||||
"Path to CSV containing the sequences to align as well as the "
|
|
||||||
"annotations for the respective sequences"
|
|
||||||
),
|
|
||||||
metavar="a",
|
|
||||||
)
|
|
||||||
argparser.add_argument(
|
|
||||||
"sequence",
|
|
||||||
type=str,
|
|
||||||
help=(
|
|
||||||
"Path to the sequence to annotate in FASTA format. "
|
|
||||||
"If multiple sequences are present, annotations will be run on each"
|
|
||||||
),
|
|
||||||
metavar="s",
|
|
||||||
)
|
|
||||||
argparser.add_argument(
|
|
||||||
"output", type=str, help="Path to output location", metavar="o"
|
|
||||||
)
|
|
||||||
argparser.add_argument(
|
|
||||||
"-I", "--id-header", type=str, help="The header for the ID of the annotation"
|
|
||||||
)
|
|
||||||
argparser.add_argument(
|
|
||||||
"-N",
|
|
||||||
"--name-header",
|
|
||||||
type=str,
|
|
||||||
help="The header for the name of the annotation",
|
|
||||||
required=False,
|
|
||||||
)
|
|
||||||
argparser.add_argument(
|
|
||||||
"-D",
|
|
||||||
"--desc-header",
|
|
||||||
type=str,
|
|
||||||
help="The header for the description of the annotation",
|
|
||||||
required=False,
|
|
||||||
)
|
|
||||||
argparser.add_argument(
|
|
||||||
"-T",
|
|
||||||
"--start-header",
|
|
||||||
type=str,
|
|
||||||
help="The header for the start of the annotation",
|
|
||||||
required=False,
|
|
||||||
)
|
|
||||||
argparser.add_argument(
|
|
||||||
"-E",
|
|
||||||
"--end-header",
|
|
||||||
type=str,
|
|
||||||
help="The header for the end of the annotation",
|
|
||||||
required=False,
|
|
||||||
)
|
|
||||||
argparser.add_argument(
|
|
||||||
"-S",
|
|
||||||
"--seq-header",
|
|
||||||
type=str,
|
|
||||||
help="The header for the sequence of the annotation",
|
|
||||||
)
|
|
||||||
args = argparser.parse_args()
|
|
||||||
given_annotations = read_annotations_from_csv(
|
|
||||||
args.annotations,
|
|
||||||
args.id_header,
|
|
||||||
args.name_header,
|
|
||||||
args.desc_header,
|
|
||||||
args.start_header,
|
|
||||||
args.end_header,
|
|
||||||
args.seq_header,
|
|
||||||
)
|
|
||||||
with open(args.sequence, "r") as sequence_fd:
|
|
||||||
for sequence in SeqIO.parse(sequence_fd, "fasta"):
|
|
||||||
aligned_annotations = protein_align_many_to_one_ssw(
|
|
||||||
str(sequence.seq), given_annotations
|
|
||||||
)
|
|
||||||
save_alignments_to_csv(
|
|
||||||
aligned_annotations,
|
|
||||||
os.path.join(
|
|
||||||
args.output,
|
|
||||||
sequence.id.replace("|", "+").replace(".", "_") + ".csv",
|
|
||||||
),
|
|
||||||
)
|
|
||||||
|
|
||||||
|
|
||||||
if __name__ == "__main__":
|
|
||||||
main()
|
|
@ -4,5 +4,8 @@ channels:
|
|||||||
dependencies:
|
dependencies:
|
||||||
- biopython=1.81
|
- biopython=1.81
|
||||||
- build=0.7
|
- build=0.7
|
||||||
- pytest=7
|
- pytest=7.3
|
||||||
|
- hypothesis=6.56
|
||||||
- twine=4
|
- twine=4
|
||||||
|
- python-build=0.10.0
|
||||||
|
- setuptools
|
11
setup.cfg
11
setup.cfg
@ -1,12 +1,17 @@
|
|||||||
[metadata]
|
[metadata]
|
||||||
name = bmlsa
|
name = bmlsa
|
||||||
version = 0.0.3
|
version = 0.0.4
|
||||||
|
|
||||||
[options]
|
[options]
|
||||||
packages = bmlsa
|
package_dir =
|
||||||
|
= src
|
||||||
install_requires =
|
install_requires =
|
||||||
biopython ==1.81
|
biopython ==1.81
|
||||||
|
|
||||||
[options.entry_points]
|
[options.entry_points]
|
||||||
console_scripts =
|
console_scripts =
|
||||||
bmlsa = bmlsa.cli:main
|
bmlsa = bmlsa.cli:main
|
||||||
|
|
||||||
|
[tool:pytest]
|
||||||
|
pythonpath = src
|
||||||
|
testpaths = tests
|
@ -1,20 +1,35 @@
|
|||||||
|
import logging
|
||||||
|
from typing import Iterable
|
||||||
from Bio.Align import PairwiseAligner, substitution_matrices
|
from Bio.Align import PairwiseAligner, substitution_matrices
|
||||||
from bmlsa.datatypes import AlignedSequence
|
from bmlsa.datatypes import AlignedSequence
|
||||||
from bmlsa.exceptions import UnexpectedAlignmentResult
|
from bmlsa.exceptions import UnexpectedAlignmentResult
|
||||||
|
|
||||||
|
logger = logging.getLogger(__name__)
|
||||||
|
|
||||||
def protein_align_many_to_one_ssw(sequence: str, queries: dict[str, AlignedSequence]):
|
|
||||||
annotation_pairs = {}
|
def align_many_to_one_ssw(
|
||||||
|
reference_sequence: str,
|
||||||
|
queries: Iterable[AlignedSequence],
|
||||||
|
extend_gap_score: int,
|
||||||
|
open_gap_score: int,
|
||||||
|
alignment_mode: str,
|
||||||
|
substitution_matrix: str = "BLOSUM62",
|
||||||
|
):
|
||||||
|
# TODO Consider using the built in "scoring" parameter
|
||||||
aligner = PairwiseAligner()
|
aligner = PairwiseAligner()
|
||||||
aligner.mode = "local"
|
aligner.substitution_matrix = substitution_matrices.load(substitution_matrix)
|
||||||
aligner.substitution_matrix = substitution_matrices.load("BLOSUM62")
|
aligner.extend_gap_score = extend_gap_score
|
||||||
aligner.extend_gap_score = -1
|
aligner.open_gap_score = open_gap_score
|
||||||
aligner.open_gap_score = -11
|
aligner.mode = alignment_mode
|
||||||
for id, query in queries.items():
|
for query in queries:
|
||||||
try:
|
try:
|
||||||
alignments = aligner.align(sequence, query.sequence)
|
alignments = aligner.align(reference_sequence, query.sequence)
|
||||||
except ValueError:
|
except ValueError:
|
||||||
|
logger.warning(
|
||||||
|
'Skipping sequence with id "%s" due to invalid characters', query.id
|
||||||
|
)
|
||||||
continue
|
continue
|
||||||
|
# TODO Implement comparison with input positions to choose best
|
||||||
if len(alignments) > 1:
|
if len(alignments) > 1:
|
||||||
raise UnexpectedAlignmentResult(
|
raise UnexpectedAlignmentResult(
|
||||||
"More than one alignment resulted from a single query."
|
"More than one alignment resulted from a single query."
|
||||||
@ -22,8 +37,8 @@ def protein_align_many_to_one_ssw(sequence: str, queries: dict[str, AlignedSeque
|
|||||||
for alignment in alignments:
|
for alignment in alignments:
|
||||||
score, query_aligned = (alignment.score, alignment.aligned[0][0])
|
score, query_aligned = (alignment.score, alignment.aligned[0][0])
|
||||||
aligned_start, aligned_end = query_aligned
|
aligned_start, aligned_end = query_aligned
|
||||||
annotation_pairs[id] = AlignedSequence(
|
yield AlignedSequence(
|
||||||
id,
|
query.id,
|
||||||
query.sequence,
|
query.sequence,
|
||||||
query.name,
|
query.name,
|
||||||
query.description,
|
query.description,
|
||||||
@ -31,7 +46,7 @@ def protein_align_many_to_one_ssw(sequence: str, queries: dict[str, AlignedSeque
|
|||||||
query.end,
|
query.end,
|
||||||
query.score,
|
query.score,
|
||||||
), AlignedSequence(
|
), AlignedSequence(
|
||||||
id,
|
query.id,
|
||||||
alignment.query,
|
alignment.query,
|
||||||
query.name,
|
query.name,
|
||||||
query.description,
|
query.description,
|
||||||
@ -39,4 +54,3 @@ def protein_align_many_to_one_ssw(sequence: str, queries: dict[str, AlignedSeque
|
|||||||
aligned_end,
|
aligned_end,
|
||||||
score,
|
score,
|
||||||
)
|
)
|
||||||
return annotation_pairs
|
|
191
src/bmlsa/cli.py
Normal file
191
src/bmlsa/cli.py
Normal file
@ -0,0 +1,191 @@
|
|||||||
|
import os
|
||||||
|
import argparse
|
||||||
|
from Bio import SeqIO
|
||||||
|
import logging
|
||||||
|
from bmlsa.aligner import align_many_to_one_ssw
|
||||||
|
|
||||||
|
from bmlsa.io import read_annotations_from_csv, save_alignments_to_csv
|
||||||
|
|
||||||
|
logger = logging.getLogger(__name__)

# Built-in scoring presets selectable through "--behave-as". Every preset
# holds exactly the keyword arguments that are forwarded to
# align_many_to_one_ssw.
DEFAULT_ALIGNMENT_PARAMETERS = {
    "BLASTp": {
        "extend_gap_score": -1,
        "open_gap_score": -11,
        "substitution_matrix": "BLOSUM62",
        "alignment_mode": "local",
    }
}

# Scoring options that have no fallback value and therefore must come either
# from the command line or from a preset.
_REQUIRED_SCORING_KEYS = ("extend_gap_score", "open_gap_score", "alignment_mode")


def _resolve_scoring_parameters(args):
    """Combine the "--behave-as" preset with the explicit scoring arguments.

    Explicitly supplied arguments take precedence over the preset, as the
    "--behave-as" help text promises. Values are compared against ``None``
    rather than by truthiness so that a score of ``0`` is accepted.

    Args:
        args: Parsed arguments providing ``extend_gap_score``,
            ``open_gap_score``, ``alignment_mode``, ``substitution_matrix``
            and ``behave_as``.

    Returns:
        A dict of keyword arguments for the aligner, or ``None`` (after
        logging an error) when the required scoring options are incomplete.
    """
    if args.behave_as in DEFAULT_ALIGNMENT_PARAMETERS:
        # Copy so the module-level preset is never mutated by overrides.
        parameters = dict(DEFAULT_ALIGNMENT_PARAMETERS[args.behave_as])
    else:
        if args.behave_as:
            logger.warning(
                'Unknown "--behave-as" value "%s", ignoring it. Known values: %s',
                args.behave_as,
                ", ".join(sorted(DEFAULT_ALIGNMENT_PARAMETERS)),
            )
        parameters = {"substitution_matrix": "BLOSUM62"}

    explicit = {
        "extend_gap_score": args.extend_gap_score,
        "open_gap_score": args.open_gap_score,
        "alignment_mode": args.alignment_mode,
        "substitution_matrix": args.substitution_matrix,
    }
    parameters.update(
        {key: value for key, value in explicit.items() if value is not None}
    )

    if any(key not in parameters for key in _REQUIRED_SCORING_KEYS):
        logger.error(
            'Must either specify all of "--extend-gap-score", "--open-gap-score", '
            '"--alignment-mode", or, at least "--behave-as". See help (-h) for '
            "more information."
        )
        return None
    return parameters


def run(args):
    """Align every annotation sequence against each reference in the FASTA.

    One CSV is written per reference record into ``args.output``; the file
    name is the record id with "|" replaced by "+" and "." replaced by "_".

    Args:
        args: Parsed command-line arguments as produced by ``main``.

    Raises:
        SystemExit: With exit code 1 when the scoring options are incomplete.
    """
    scoring_parameters = _resolve_scoring_parameters(args)
    if scoring_parameters is None:
        raise SystemExit(1)

    # read_annotations_from_csv yields its results, so the returned iterator
    # can be consumed only once. Materialise it so that every reference
    # sequence in a multi-record FASTA is aligned against all queries instead
    # of only the first reference.
    queries = list(
        read_annotations_from_csv(
            args.annotations,
            args.id_header,
            args.seq_header,
            args.name_header,
            args.desc_header,
            args.start_header,
            args.end_header,
        )
    )

    with open(args.sequence, "r") as sequence_fd:
        for sequence in SeqIO.parse(sequence_fd, "fasta"):
            aligned_annotations = align_many_to_one_ssw(
                str(sequence.seq), queries, **scoring_parameters
            )
            output_name = sequence.id.replace("|", "+").replace(".", "_") + ".csv"
            save_alignments_to_csv(
                aligned_annotations,
                os.path.join(args.output, output_name),
            )
|
||||||
|
|
||||||
|
|
||||||
|
def main(argv=None):
    """Parse the command line and run the alignment.

    Args:
        argv: Optional list of argument strings. When ``None`` (the default,
            used by the console-script entry point) argparse reads
            ``sys.argv[1:]``.
    """
    arg_parser = argparse.ArgumentParser("bmlsa")

    # Positional arguments: input annotations, reference FASTA, output folder.
    arg_parser.add_argument(
        "annotations",
        type=str,
        help=(
            "Path to CSV containing the sequences to align as well as the "
            "annotations for the respective sequences."
        ),
        metavar="a",
    )
    arg_parser.add_argument(
        "sequence",
        type=str,
        help=(
            "Path to the sequence to use as reference in FASTA format. "
            "If multiple sequences are present in the same FASTA file, "
            "each will be used as a separate reference sequence for separate "
            "runs automatically."
        ),
        metavar="s",
    )
    arg_parser.add_argument(
        "output", type=str, help="Path to output location", metavar="o"
    )

    # Names of the CSV columns to read; only the ID and sequence columns are
    # mandatory.
    arg_parser.add_argument(
        "-I",
        "--id-header",
        type=str,
        help="The header of the column for the ID of the sequence to align to "
        "the reference sequence.",
        required=True,
    )
    arg_parser.add_argument(
        "-N",
        "--name-header",
        type=str,
        help="The header of the column for the name of the sequence to align to "
        "the reference sequence.",
        required=False,
    )
    arg_parser.add_argument(
        "-D",
        "--desc-header",
        type=str,
        help="The header of the column for the description of the sequence to "
        "align to the reference sequence.",
        required=False,
    )
    arg_parser.add_argument(
        "-T",
        "--start-header",
        type=str,
        help="The header of the column for the start position of the sequence to "
        "align to the reference sequence.",
        required=False,
    )
    arg_parser.add_argument(
        "-E",
        "--end-header",
        type=str,
        help="The header of the column for end position of the sequence to "
        "align to the reference sequence.",
        required=False,
    )
    arg_parser.add_argument(
        "-S",
        "--seq-header",
        type=str,
        help="The header of the column for the actual sequence to align to the "
        "reference sequence.",
        required=True,
    )

    # Alignment scoring options; all default to None so that run() can tell
    # "not given" apart from an explicit value.
    arg_parser.add_argument(
        "-e",
        "--extend-gap-score",
        type=int,
        help="The scoring for extending a gap.",
        required=False,
        default=None,
    )
    arg_parser.add_argument(
        "-o",
        "--open-gap-score",
        type=int,
        help="The scoring for opening a gap.",
        required=False,
        default=None,
    )
    arg_parser.add_argument(
        "-M",
        "--alignment-mode",
        type=str,
        help="The alignment mode.",
        choices=["local", "global"],
        required=False,
    )
    arg_parser.add_argument(
        "-m",
        "--substitution-matrix",
        # argparse requires a callable here; the string "str" raised
        # ValueError as soon as the parser was built.
        type=str,
        help="The name of the substitution matrix.",
        required=False,
        default=None,
    )
    arg_parser.add_argument(
        "-B",
        "--behave-as",
        type=str,
        help="Use built-in parameters for alignment scoring. If this is specified "
        "alongside any of the scoring arguments, the alignment parameter arguments "
        '("--open-gap-score" and/or "--extend-gap-score" and "--alignment-mode") '
        "will override any defaults set by this argument.",
        required=False,
        default=None,
    )

    args = arg_parser.parse_args(argv)
    run(args)


if __name__ == "__main__":
    main()
|
@ -1,4 +1,5 @@
|
|||||||
import csv
|
import csv
|
||||||
|
from typing import Iterable
|
||||||
|
|
||||||
from bmlsa.datatypes import AlignedSequence
|
from bmlsa.datatypes import AlignedSequence
|
||||||
|
|
||||||
@ -6,39 +7,39 @@ from bmlsa.datatypes import AlignedSequence
|
|||||||
def read_annotations_from_csv(
|
def read_annotations_from_csv(
|
||||||
csv_path: str,
|
csv_path: str,
|
||||||
id_header: str,
|
id_header: str,
|
||||||
name_header: str,
|
|
||||||
desc_header: str,
|
|
||||||
start_header: str,
|
|
||||||
end_header: str,
|
|
||||||
sequence_header: str,
|
sequence_header: str,
|
||||||
|
name_header: str = None,
|
||||||
|
desc_header: str = None,
|
||||||
|
start_header: str = None,
|
||||||
|
end_header: str = None,
|
||||||
):
|
):
|
||||||
annotations = {}
|
annotations = {}
|
||||||
with open(csv_path, "r") as csv_fd:
|
with open(csv_path, "r") as csv_fd:
|
||||||
reader = csv.reader(csv_fd)
|
reader = csv.reader(csv_fd)
|
||||||
id_ind = None
|
id_ind = None
|
||||||
|
sequence_ind = None
|
||||||
name_ind = None
|
name_ind = None
|
||||||
desc_ind = None
|
desc_ind = None
|
||||||
start_ind = None
|
start_ind = None
|
||||||
end_ind = None
|
end_ind = None
|
||||||
sequence_ind = None
|
|
||||||
headers_parsed = False
|
headers_parsed = False
|
||||||
for row in reader:
|
for row in reader:
|
||||||
if not headers_parsed:
|
if not headers_parsed:
|
||||||
id_ind = row.index(id_header)
|
id_ind = row.index(id_header)
|
||||||
|
sequence_ind = row.index(sequence_header)
|
||||||
name_ind = row.index(name_header) if name_header else None
|
name_ind = row.index(name_header) if name_header else None
|
||||||
desc_ind = row.index(desc_header) if desc_header else None
|
desc_ind = row.index(desc_header) if desc_header else None
|
||||||
start_ind = row.index(start_header) if start_header else None
|
start_ind = row.index(start_header) if start_header else None
|
||||||
end_ind = row.index(end_header) if end_header else None
|
end_ind = row.index(end_header) if end_header else None
|
||||||
sequence_ind = row.index(sequence_header)
|
|
||||||
headers_parsed = True
|
headers_parsed = True
|
||||||
continue
|
continue
|
||||||
id = row[id_ind]
|
id = row[id_ind]
|
||||||
|
sequence = row[sequence_ind]
|
||||||
name = row[name_ind] if name_header else None
|
name = row[name_ind] if name_header else None
|
||||||
desc = row[desc_ind] if desc_header else None
|
desc = row[desc_ind] if desc_header else None
|
||||||
start = row[start_ind] if start_header else None
|
start = row[start_ind] if start_header else None
|
||||||
end = row[end_ind] if end_header else None
|
end = row[end_ind] if end_header else None
|
||||||
sequence = row[sequence_ind]
|
yield AlignedSequence(
|
||||||
annotations[id] = AlignedSequence(
|
|
||||||
id,
|
id,
|
||||||
sequence,
|
sequence,
|
||||||
name,
|
name,
|
||||||
@ -46,18 +47,16 @@ def read_annotations_from_csv(
|
|||||||
int(start) if start else None,
|
int(start) if start else None,
|
||||||
int(end) if end else None,
|
int(end) if end else None,
|
||||||
)
|
)
|
||||||
return annotations
|
|
||||||
|
|
||||||
|
|
||||||
def save_alignments_to_csv(
|
def save_alignments_to_csv(
|
||||||
aligned_pairs: dict[str, tuple[AlignedSequence, AlignedSequence]], output_path: str
|
aligned_pairs: Iterable[tuple[AlignedSequence, AlignedSequence]], output_path: str
|
||||||
):
|
):
|
||||||
with open(output_path, "w") as output_fd:
|
with open(output_path, "w") as output_fd:
|
||||||
writer = csv.writer(output_fd)
|
writer = csv.writer(output_fd)
|
||||||
header_wrote = False
|
header_wrote = False
|
||||||
header_order = None
|
header_order = None
|
||||||
for id, annotations in aligned_pairs.items():
|
for original, aligned in aligned_pairs:
|
||||||
original, aligned = annotations
|
|
||||||
original_vars = vars(original)
|
original_vars = vars(original)
|
||||||
aligned_vars = vars(aligned)
|
aligned_vars = vars(aligned)
|
||||||
if not header_wrote:
|
if not header_wrote:
|
51
tests/bmlsa/test_aligner.py
Normal file
51
tests/bmlsa/test_aligner.py
Normal file
@ -0,0 +1,51 @@
|
|||||||
|
import pytest
|
||||||
|
from Bio import SeqIO
|
||||||
|
from bmlsa.aligner import align_many_to_one_ssw
|
||||||
|
from bmlsa.cli import DEFAULT_ALIGNMENT_PARAMETERS
|
||||||
|
from bmlsa.datatypes import AlignedSequence
|
||||||
|
from collections.abc import Iterable
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.fixture
def reference_sequence():
    """Return the first record of the bundled reference FASTA as a string."""
    fasta_records = list(
        SeqIO.parse("tests/resources/NC_045512_coding.fasta", "fasta")
    )
    first_record = fasta_records[0]
    return str(first_record.seq)
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.fixture
def queries():
    """Return a single-element list holding the ORF10 query sequence."""
    orf10 = AlignedSequence(
        "ORF10",
        "ATGGGCTATATAAACGTTTTCGCTTTTCCGTTTACGATATATAGTCTACTCTTGTGCAGAAT"
        "GAATTCTCGTAACTACATAGCACAAGTAGATGTAGTTAACTTTAATCTCACATAG",
        start=29558,
        end=29674,
    )
    return [orf10]
|
||||||
|
|
||||||
|
|
||||||
|
def test_align_many_to_one_returns_data(reference_sequence, queries):
    """The aligner hands back something that can be iterated."""
    blastp_parameters = DEFAULT_ALIGNMENT_PARAMETERS["BLASTp"]
    alignment_pairs = align_many_to_one_ssw(
        reference_sequence, queries, **blastp_parameters
    )
    assert isinstance(alignment_pairs, Iterable)
|
||||||
|
|
||||||
|
|
||||||
|
def test_align_many_to_one_returns_correct_data_structure(reference_sequence, queries):
    """Each yielded item is an (original, aligned) pair of AlignedSequence."""
    blastp_parameters = DEFAULT_ALIGNMENT_PARAMETERS["BLASTp"]
    alignment_pairs = align_many_to_one_ssw(
        reference_sequence, queries, **blastp_parameters
    )
    for source_seq, result_seq in alignment_pairs:
        assert isinstance(source_seq, AlignedSequence)
        assert isinstance(result_seq, AlignedSequence)
|
||||||
|
|
||||||
|
|
||||||
|
def test_align_many_to_one_returns_correct_data(reference_sequence, queries):
    """The aligned start and end positions equal the ones given in the query."""
    blastp_parameters = DEFAULT_ALIGNMENT_PARAMETERS["BLASTp"]
    alignment_pairs = align_many_to_one_ssw(
        reference_sequence, queries, **blastp_parameters
    )
    for source_seq, result_seq in alignment_pairs:
        assert source_seq.start == result_seq.start
        assert source_seq.end == result_seq.end
|
35
tests/bmlsa/test_io.py
Normal file
35
tests/bmlsa/test_io.py
Normal file
@ -0,0 +1,35 @@
|
|||||||
|
from csv import reader
|
||||||
|
from os import path
|
||||||
|
from bmlsa.datatypes import AlignedSequence
|
||||||
|
from bmlsa.io import read_annotations_from_csv, save_alignments_to_csv
|
||||||
|
from collections.abc import Iterable
|
||||||
|
|
||||||
|
|
||||||
|
def test_read_annotations_from_csv_has_data():
    """Reading the sample CSV hands back something that can be iterated."""
    csv_path = "tests/resources/SARS_CoV-2_genes.csv"
    annotations = read_annotations_from_csv(csv_path, "id", "sequence")
    assert isinstance(annotations, Iterable)
|
||||||
|
|
||||||
|
|
||||||
|
def test_read_annotations_from_csv_data_valid():
    """Every annotation read from the sample CSV has a string id and sequence."""
    csv_path = "tests/resources/SARS_CoV-2_genes.csv"
    annotations = read_annotations_from_csv(csv_path, "id", "sequence")
    for annotation in annotations:
        assert isinstance(annotation.id, str)
        assert isinstance(annotation.sequence, str)
|
||||||
|
|
||||||
|
|
||||||
|
def test_save_alignments_to_csv_produces_correct_headers_in_csv(tmpdir):
    """The CSV header row has an "original" and an "aligned" column per field."""
    dummy_sequence = AlignedSequence("DUMMY", "ATACTGGAAAA", name="test_sequence")
    output_path = path.join(tmpdir, "alignment_results.csv")
    save_alignments_to_csv([(dummy_sequence, dummy_sequence)], output_path)

    with open(output_path, "r") as csv_fd:
        rows = list(reader(csv_fd))

    for field_name in list(vars(dummy_sequence).keys()):
        assert "original" + field_name in rows[0]
        assert "aligned" + field_name in rows[0]
|
430
tests/resources/NC_045512_coding.fasta
Normal file
430
tests/resources/NC_045512_coding.fasta
Normal file
@ -0,0 +1,430 @@
|
|||||||
|
>NC_045512.2 Severe acute respiratory syndrome coronavirus 2 isolate Wuhan-Hu-1, complete genome
|
||||||
|
ATTAAAGGTTTATACCTTCCCAGGTAACAAACCAACCAACTTTCGATCTCTTGTAGATCTGTTCTCTAAA
|
||||||
|
CGAACTTTAAAATCTGTGTGGCTGTCACTCGGCTGCATGCTTAGTGCACTCACGCAGTATAATTAATAAC
|
||||||
|
TAATTACTGTCGTTGACAGGACACGAGTAACTCGTCTATCTTCTGCAGGCTGCTTACGGTTTCGTCCGTG
|
||||||
|
TTGCAGCCGATCATCAGCACATCTAGGTTTCGTCCGGGTGTGACCGAAAGGTAAGATGGAGAGCCTTGTC
|
||||||
|
CCTGGTTTCAACGAGAAAACACACGTCCAACTCAGTTTGCCTGTTTTACAGGTTCGCGACGTGCTCGTAC
|
||||||
|
GTGGCTTTGGAGACTCCGTGGAGGAGGTCTTATCAGAGGCACGTCAACATCTTAAAGATGGCACTTGTGG
|
||||||
|
CTTAGTAGAAGTTGAAAAAGGCGTTTTGCCTCAACTTGAACAGCCCTATGTGTTCATCAAACGTTCGGAT
|
||||||
|
GCTCGAACTGCACCTCATGGTCATGTTATGGTTGAGCTGGTAGCAGAACTCGAAGGCATTCAGTACGGTC
|
||||||
|
GTAGTGGTGAGACACTTGGTGTCCTTGTCCCTCATGTGGGCGAAATACCAGTGGCTTACCGCAAGGTTCT
|
||||||
|
TCTTCGTAAGAACGGTAATAAAGGAGCTGGTGGCCATAGTTACGGCGCCGATCTAAAGTCATTTGACTTA
|
||||||
|
GGCGACGAGCTTGGCACTGATCCTTATGAAGATTTTCAAGAAAACTGGAACACTAAACATAGCAGTGGTG
|
||||||
|
TTACCCGTGAACTCATGCGTGAGCTTAACGGAGGGGCATACACTCGCTATGTCGATAACAACTTCTGTGG
|
||||||
|
CCCTGATGGCTACCCTCTTGAGTGCATTAAAGACCTTCTAGCACGTGCTGGTAAAGCTTCATGCACTTTG
|
||||||
|
TCCGAACAACTGGACTTTATTGACACTAAGAGGGGTGTATACTGCTGCCGTGAACATGAGCATGAAATTG
|
||||||
|
CTTGGTACACGGAACGTTCTGAAAAGAGCTATGAATTGCAGACACCTTTTGAAATTAAATTGGCAAAGAA
|
||||||
|
ATTTGACACCTTCAATGGGGAATGTCCAAATTTTGTATTTCCCTTAAATTCCATAATCAAGACTATTCAA
|
||||||
|
CCAAGGGTTGAAAAGAAAAAGCTTGATGGCTTTATGGGTAGAATTCGATCTGTCTATCCAGTTGCGTCAC
|
||||||
|
CAAATGAATGCAACCAAATGTGCCTTTCAACTCTCATGAAGTGTGATCATTGTGGTGAAACTTCATGGCA
|
||||||
|
GACGGGCGATTTTGTTAAAGCCACTTGCGAATTTTGTGGCACTGAGAATTTGACTAAAGAAGGTGCCACT
|
||||||
|
ACTTGTGGTTACTTACCCCAAAATGCTGTTGTTAAAATTTATTGTCCAGCATGTCACAATTCAGAAGTAG
|
||||||
|
GACCTGAGCATAGTCTTGCCGAATACCATAATGAATCTGGCTTGAAAACCATTCTTCGTAAGGGTGGTCG
|
||||||
|
CACTATTGCCTTTGGAGGCTGTGTGTTCTCTTATGTTGGTTGCCATAACAAGTGTGCCTATTGGGTTCCA
|
||||||
|
CGTGCTAGCGCTAACATAGGTTGTAACCATACAGGTGTTGTTGGAGAAGGTTCCGAAGGTCTTAATGACA
|
||||||
|
ACCTTCTTGAAATACTCCAAAAAGAGAAAGTCAACATCAATATTGTTGGTGACTTTAAACTTAATGAAGA
|
||||||
|
GATCGCCATTATTTTGGCATCTTTTTCTGCTTCCACAAGTGCTTTTGTGGAAACTGTGAAAGGTTTGGAT
|
||||||
|
TATAAAGCATTCAAACAAATTGTTGAATCCTGTGGTAATTTTAAAGTTACAAAAGGAAAAGCTAAAAAAG
|
||||||
|
GTGCCTGGAATATTGGTGAACAGAAATCAATACTGAGTCCTCTTTATGCATTTGCATCAGAGGCTGCTCG
|
||||||
|
TGTTGTACGATCAATTTTCTCCCGCACTCTTGAAACTGCTCAAAATTCTGTGCGTGTTTTACAGAAGGCC
|
||||||
|
GCTATAACAATACTAGATGGAATTTCACAGTATTCACTGAGACTCATTGATGCTATGATGTTCACATCTG
|
||||||
|
ATTTGGCTACTAACAATCTAGTTGTAATGGCCTACATTACAGGTGGTGTTGTTCAGTTGACTTCGCAGTG
|
||||||
|
GCTAACTAACATCTTTGGCACTGTTTATGAAAAACTCAAACCCGTCCTTGATTGGCTTGAAGAGAAGTTT
|
||||||
|
AAGGAAGGTGTAGAGTTTCTTAGAGACGGTTGGGAAATTGTTAAATTTATCTCAACCTGTGCTTGTGAAA
|
||||||
|
TTGTCGGTGGACAAATTGTCACCTGTGCAAAGGAAATTAAGGAGAGTGTTCAGACATTCTTTAAGCTTGT
|
||||||
|
AAATAAATTTTTGGCTTTGTGTGCTGACTCTATCATTATTGGTGGAGCTAAACTTAAAGCCTTGAATTTA
|
||||||
|
GGTGAAACATTTGTCACGCACTCAAAGGGATTGTACAGAAAGTGTGTTAAATCCAGAGAAGAAACTGGCC
|
||||||
|
TACTCATGCCTCTAAAAGCCCCAAAAGAAATTATCTTCTTAGAGGGAGAAACACTTCCCACAGAAGTGTT
|
||||||
|
AACAGAGGAAGTTGTCTTGAAAACTGGTGATTTACAACCATTAGAACAACCTACTAGTGAAGCTGTTGAA
|
||||||
|
GCTCCATTGGTTGGTACACCAGTTTGTATTAACGGGCTTATGTTGCTCGAAATCAAAGACACAGAAAAGT
|
||||||
|
ACTGTGCCCTTGCACCTAATATGATGGTAACAAACAATACCTTCACACTCAAAGGCGGTGCACCAACAAA
|
||||||
|
GGTTACTTTTGGTGATGACACTGTGATAGAAGTGCAAGGTTACAAGAGTGTGAATATCACTTTTGAACTT
|
||||||
|
GATGAAAGGATTGATAAAGTACTTAATGAGAAGTGCTCTGCCTATACAGTTGAACTCGGTACAGAAGTAA
|
||||||
|
ATGAGTTCGCCTGTGTTGTGGCAGATGCTGTCATAAAAACTTTGCAACCAGTATCTGAATTACTTACACC
|
||||||
|
ACTGGGCATTGATTTAGATGAGTGGAGTATGGCTACATACTACTTATTTGATGAGTCTGGTGAGTTTAAA
|
||||||
|
TTGGCTTCACATATGTATTGTTCTTTCTACCCTCCAGATGAGGATGAAGAAGAAGGTGATTGTGAAGAAG
|
||||||
|
AAGAGTTTGAGCCATCAACTCAATATGAGTATGGTACTGAAGATGATTACCAAGGTAAACCTTTGGAATT
|
||||||
|
TGGTGCCACTTCTGCTGCTCTTCAACCTGAAGAAGAGCAAGAAGAAGATTGGTTAGATGATGATAGTCAA
|
||||||
|
CAAACTGTTGGTCAACAAGACGGCAGTGAGGACAATCAGACAACTACTATTCAAACAATTGTTGAGGTTC
|
||||||
|
AACCTCAATTAGAGATGGAACTTACACCAGTTGTTCAGACTATTGAAGTGAATAGTTTTAGTGGTTATTT
|
||||||
|
AAAACTTACTGACAATGTATACATTAAAAATGCAGACATTGTGGAAGAAGCTAAAAAGGTAAAACCAACA
|
||||||
|
GTGGTTGTTAATGCAGCCAATGTTTACCTTAAACATGGAGGAGGTGTTGCAGGAGCCTTAAATAAGGCTA
|
||||||
|
CTAACAATGCCATGCAAGTTGAATCTGATGATTACATAGCTACTAATGGACCACTTAAAGTGGGTGGTAG
|
||||||
|
TTGTGTTTTAAGCGGACACAATCTTGCTAAACACTGTCTTCATGTTGTCGGCCCAAATGTTAACAAAGGT
|
||||||
|
GAAGACATTCAACTTCTTAAGAGTGCTTATGAAAATTTTAATCAGCACGAAGTTCTACTTGCACCATTAT
|
||||||
|
TATCAGCTGGTATTTTTGGTGCTGACCCTATACATTCTTTAAGAGTTTGTGTAGATACTGTTCGCACAAA
|
||||||
|
TGTCTACTTAGCTGTCTTTGATAAAAATCTCTATGACAAACTTGTTTCAAGCTTTTTGGAAATGAAGAGT
|
||||||
|
GAAAAGCAAGTTGAACAAAAGATCGCTGAGATTCCTAAAGAGGAAGTTAAGCCATTTATAACTGAAAGTA
|
||||||
|
AACCTTCAGTTGAACAGAGAAAACAAGATGATAAGAAAATCAAAGCTTGTGTTGAAGAAGTTACAACAAC
|
||||||
|
TCTGGAAGAAACTAAGTTCCTCACAGAAAACTTGTTACTTTATATTGACATTAATGGCAATCTTCATCCA
|
||||||
|
GATTCTGCCACTCTTGTTAGTGACATTGACATCACTTTCTTAAAGAAAGATGCTCCATATATAGTGGGTG
|
||||||
|
ATGTTGTTCAAGAGGGTGTTTTAACTGCTGTGGTTATACCTACTAAAAAGGCTGGTGGCACTACTGAAAT
|
||||||
|
GCTAGCGAAAGCTTTGAGAAAAGTGCCAACAGACAATTATATAACCACTTACCCGGGTCAGGGTTTAAAT
|
||||||
|
GGTTACACTGTAGAGGAGGCAAAGACAGTGCTTAAAAAGTGTAAAAGTGCCTTTTACATTCTACCATCTA
|
||||||
|
TTATCTCTAATGAGAAGCAAGAAATTCTTGGAACTGTTTCTTGGAATTTGCGAGAAATGCTTGCACATGC
|
||||||
|
AGAAGAAACACGCAAATTAATGCCTGTCTGTGTGGAAACTAAAGCCATAGTTTCAACTATACAGCGTAAA
|
||||||
|
TATAAGGGTATTAAAATACAAGAGGGTGTGGTTGATTATGGTGCTAGATTTTACTTTTACACCAGTAAAA
|
||||||
|
CAACTGTAGCGTCACTTATCAACACACTTAACGATCTAAATGAAACTCTTGTTACAATGCCACTTGGCTA
|
||||||
|
TGTAACACATGGCTTAAATTTGGAAGAAGCTGCTCGGTATATGAGATCTCTCAAAGTGCCAGCTACAGTT
|
||||||
|
TCTGTTTCTTCACCTGATGCTGTTACAGCGTATAATGGTTATCTTACTTCTTCTTCTAAAACACCTGAAG
|
||||||
|
AACATTTTATTGAAACCATCTCACTTGCTGGTTCCTATAAAGATTGGTCCTATTCTGGACAATCTACACA
|
||||||
|
ACTAGGTATAGAATTTCTTAAGAGAGGTGATAAAAGTGTATATTACACTAGTAATCCTACCACATTCCAC
|
||||||
|
CTAGATGGTGAAGTTATCACCTTTGACAATCTTAAGACACTTCTTTCTTTGAGAGAAGTGAGGACTATTA
|
||||||
|
AGGTGTTTACAACAGTAGACAACATTAACCTCCACACGCAAGTTGTGGACATGTCAATGACATATGGACA
|
||||||
|
ACAGTTTGGTCCAACTTATTTGGATGGAGCTGATGTTACTAAAATAAAACCTCATAATTCACATGAAGGT
|
||||||
|
AAAACATTTTATGTTTTACCTAATGATGACACTCTACGTGTTGAGGCTTTTGAGTACTACCACACAACTG
|
||||||
|
ATCCTAGTTTTCTGGGTAGGTACATGTCAGCATTAAATCACACTAAAAAGTGGAAATACCCACAAGTTAA
|
||||||
|
TGGTTTAACTTCTATTAAATGGGCAGATAACAACTGTTATCTTGCCACTGCATTGTTAACACTCCAACAA
|
||||||
|
ATAGAGTTGAAGTTTAATCCACCTGCTCTACAAGATGCTTATTACAGAGCAAGGGCTGGTGAAGCTGCTA
|
||||||
|
ACTTTTGTGCACTTATCTTAGCCTACTGTAATAAGACAGTAGGTGAGTTAGGTGATGTTAGAGAAACAAT
|
||||||
|
GAGTTACTTGTTTCAACATGCCAATTTAGATTCTTGCAAAAGAGTCTTGAACGTGGTGTGTAAAACTTGT
|
||||||
|
GGACAACAGCAGACAACCCTTAAGGGTGTAGAAGCTGTTATGTACATGGGCACACTTTCTTATGAACAAT
|
||||||
|
TTAAGAAAGGTGTTCAGATACCTTGTACGTGTGGTAAACAAGCTACAAAATATCTAGTACAACAGGAGTC
|
||||||
|
ACCTTTTGTTATGATGTCAGCACCACCTGCTCAGTATGAACTTAAGCATGGTACATTTACTTGTGCTAGT
|
||||||
|
GAGTACACTGGTAATTACCAGTGTGGTCACTATAAACATATAACTTCTAAAGAAACTTTGTATTGCATAG
|
||||||
|
ACGGTGCTTTACTTACAAAGTCCTCAGAATACAAAGGTCCTATTACGGATGTTTTCTACAAAGAAAACAG
|
||||||
|
TTACACAACAACCATAAAACCAGTTACTTATAAATTGGATGGTGTTGTTTGTACAGAAATTGACCCTAAG
|
||||||
|
TTGGACAATTATTATAAGAAAGACAATTCTTATTTCACAGAGCAACCAATTGATCTTGTACCAAACCAAC
|
||||||
|
CATATCCAAACGCAAGCTTCGATAATTTTAAGTTTGTATGTGATAATATCAAATTTGCTGATGATTTAAA
|
||||||
|
CCAGTTAACTGGTTATAAGAAACCTGCTTCAAGAGAGCTTAAAGTTACATTTTTCCCTGACTTAAATGGT
|
||||||
|
GATGTGGTGGCTATTGATTATAAACACTACACACCCTCTTTTAAGAAAGGAGCTAAATTGTTACATAAAC
|
||||||
|
CTATTGTTTGGCATGTTAACAATGCAACTAATAAAGCCACGTATAAACCAAATACCTGGTGTATACGTTG
|
||||||
|
TCTTTGGAGCACAAAACCAGTTGAAACATCAAATTCGTTTGATGTACTGAAGTCAGAGGACGCGCAGGGA
|
||||||
|
ATGGATAATCTTGCCTGCGAAGATCTAAAACCAGTCTCTGAAGAAGTAGTGGAAAATCCTACCATACAGA
|
||||||
|
AAGACGTTCTTGAGTGTAATGTGAAAACTACCGAAGTTGTAGGAGACATTATACTTAAACCAGCAAATAA
|
||||||
|
TAGTTTAAAAATTACAGAAGAGGTTGGCCACACAGATCTAATGGCTGCTTATGTAGACAATTCTAGTCTT
|
||||||
|
ACTATTAAGAAACCTAATGAATTATCTAGAGTATTAGGTTTGAAAACCCTTGCTACTCATGGTTTAGCTG
|
||||||
|
CTGTTAATAGTGTCCCTTGGGATACTATAGCTAATTATGCTAAGCCTTTTCTTAACAAAGTTGTTAGTAC
|
||||||
|
AACTACTAACATAGTTACACGGTGTTTAAACCGTGTTTGTACTAATTATATGCCTTATTTCTTTACTTTA
|
||||||
|
TTGCTACAATTGTGTACTTTTACTAGAAGTACAAATTCTAGAATTAAAGCATCTATGCCGACTACTATAG
|
||||||
|
CAAAGAATACTGTTAAGAGTGTCGGTAAATTTTGTCTAGAGGCTTCATTTAATTATTTGAAGTCACCTAA
|
||||||
|
TTTTTCTAAACTGATAAATATTATAATTTGGTTTTTACTATTAAGTGTTTGCCTAGGTTCTTTAATCTAC
|
||||||
|
TCAACCGCTGCTTTAGGTGTTTTAATGTCTAATTTAGGCATGCCTTCTTACTGTACTGGTTACAGAGAAG
|
||||||
|
GCTATTTGAACTCTACTAATGTCACTATTGCAACCTACTGTACTGGTTCTATACCTTGTAGTGTTTGTCT
|
||||||
|
TAGTGGTTTAGATTCTTTAGACACCTATCCTTCTTTAGAAACTATACAAATTACCATTTCATCTTTTAAA
|
||||||
|
TGGGATTTAACTGCTTTTGGCTTAGTTGCAGAGTGGTTTTTGGCATATATTCTTTTCACTAGGTTTTTCT
|
||||||
|
ATGTACTTGGATTGGCTGCAATCATGCAATTGTTTTTCAGCTATTTTGCAGTACATTTTATTAGTAATTC
|
||||||
|
TTGGCTTATGTGGTTAATAATTAATCTTGTACAAATGGCCCCGATTTCAGCTATGGTTAGAATGTACATC
|
||||||
|
TTCTTTGCATCATTTTATTATGTATGGAAAAGTTATGTGCATGTTGTAGACGGTTGTAATTCATCAACTT
|
||||||
|
GTATGATGTGTTACAAACGTAATAGAGCAACAAGAGTCGAATGTACAACTATTGTTAATGGTGTTAGAAG
|
||||||
|
GTCCTTTTATGTCTATGCTAATGGAGGTAAAGGCTTTTGCAAACTACACAATTGGAATTGTGTTAATTGT
|
||||||
|
GATACATTCTGTGCTGGTAGTACATTTATTAGTGATGAAGTTGCGAGAGACTTGTCACTACAGTTTAAAA
|
||||||
|
GACCAATAAATCCTACTGACCAGTCTTCTTACATCGTTGATAGTGTTACAGTGAAGAATGGTTCCATCCA
|
||||||
|
TCTTTACTTTGATAAAGCTGGTCAAAAGACTTATGAAAGACATTCTCTCTCTCATTTTGTTAACTTAGAC
|
||||||
|
AACCTGAGAGCTAATAACACTAAAGGTTCATTGCCTATTAATGTTATAGTTTTTGATGGTAAATCAAAAT
|
||||||
|
GTGAAGAATCATCTGCAAAATCAGCGTCTGTTTACTACAGTCAGCTTATGTGTCAACCTATACTGTTACT
|
||||||
|
AGATCAGGCATTAGTGTCTGATGTTGGTGATAGTGCGGAAGTTGCAGTTAAAATGTTTGATGCTTACGTT
|
||||||
|
AATACGTTTTCATCAACTTTTAACGTACCAATGGAAAAACTCAAAACACTAGTTGCAACTGCAGAAGCTG
|
||||||
|
AACTTGCAAAGAATGTGTCCTTAGACAATGTCTTATCTACTTTTATTTCAGCAGCTCGGCAAGGGTTTGT
|
||||||
|
TGATTCAGATGTAGAAACTAAAGATGTTGTTGAATGTCTTAAATTGTCACATCAATCTGACATAGAAGTT
|
||||||
|
ACTGGCGATAGTTGTAATAACTATATGCTCACCTATAACAAAGTTGAAAACATGACACCCCGTGACCTTG
|
||||||
|
GTGCTTGTATTGACTGTAGTGCGCGTCATATTAATGCGCAGGTAGCAAAAAGTCACAACATTGCTTTGAT
|
||||||
|
ATGGAACGTTAAAGATTTCATGTCATTGTCTGAACAACTACGAAAACAAATACGTAGTGCTGCTAAAAAG
|
||||||
|
AATAACTTACCTTTTAAGTTGACATGTGCAACTACTAGACAAGTTGTTAATGTTGTAACAACAAAGATAG
|
||||||
|
CACTTAAGGGTGGTAAAATTGTTAATAATTGGTTGAAGCAGTTAATTAAAGTTACACTTGTGTTCCTTTT
|
||||||
|
TGTTGCTGCTATTTTCTATTTAATAACACCTGTTCATGTCATGTCTAAACATACTGACTTTTCAAGTGAA
|
||||||
|
ATCATAGGATACAAGGCTATTGATGGTGGTGTCACTCGTGACATAGCATCTACAGATACTTGTTTTGCTA
|
||||||
|
ACAAACATGCTGATTTTGACACATGGTTTAGCCAGCGTGGTGGTAGTTATACTAATGACAAAGCTTGCCC
|
||||||
|
ATTGATTGCTGCAGTCATAACAAGAGAAGTGGGTTTTGTCGTGCCTGGTTTGCCTGGCACGATATTACGC
|
||||||
|
ACAACTAATGGTGACTTTTTGCATTTCTTACCTAGAGTTTTTAGTGCAGTTGGTAACATCTGTTACACAC
|
||||||
|
CATCAAAACTTATAGAGTACACTGACTTTGCAACATCAGCTTGTGTTTTGGCTGCTGAATGTACAATTTT
|
||||||
|
TAAAGATGCTTCTGGTAAGCCAGTACCATATTGTTATGATACCAATGTACTAGAAGGTTCTGTTGCTTAT
|
||||||
|
GAAAGTTTACGCCCTGACACACGTTATGTGCTCATGGATGGCTCTATTATTCAATTTCCTAACACCTACC
|
||||||
|
TTGAAGGTTCTGTTAGAGTGGTAACAACTTTTGATTCTGAGTACTGTAGGCACGGCACTTGTGAAAGATC
|
||||||
|
AGAAGCTGGTGTTTGTGTATCTACTAGTGGTAGATGGGTACTTAACAATGATTATTACAGATCTTTACCA
|
||||||
|
GGAGTTTTCTGTGGTGTAGATGCTGTAAATTTACTTACTAATATGTTTACACCACTAATTCAACCTATTG
|
||||||
|
GTGCTTTGGACATATCAGCATCTATAGTAGCTGGTGGTATTGTAGCTATCGTAGTAACATGCCTTGCCTA
|
||||||
|
CTATTTTATGAGGTTTAGAAGAGCTTTTGGTGAATACAGTCATGTAGTTGCCTTTAATACTTTACTATTC
|
||||||
|
CTTATGTCATTCACTGTACTCTGTTTAACACCAGTTTACTCATTCTTACCTGGTGTTTATTCTGTTATTT
|
||||||
|
ACTTGTACTTGACATTTTATCTTACTAATGATGTTTCTTTTTTAGCACATATTCAGTGGATGGTTATGTT
|
||||||
|
CACACCTTTAGTACCTTTCTGGATAACAATTGCTTATATCATTTGTATTTCCACAAAGCATTTCTATTGG
|
||||||
|
TTCTTTAGTAATTACCTAAAGAGACGTGTAGTCTTTAATGGTGTTTCCTTTAGTACTTTTGAAGAAGCTG
|
||||||
|
CGCTGTGCACCTTTTTGTTAAATAAAGAAATGTATCTAAAGTTGCGTAGTGATGTGCTATTACCTCTTAC
|
||||||
|
GCAATATAATAGATACTTAGCTCTTTATAATAAGTACAAGTATTTTAGTGGAGCAATGGATACAACTAGC
|
||||||
|
TACAGAGAAGCTGCTTGTTGTCATCTCGCAAAGGCTCTCAATGACTTCAGTAACTCAGGTTCTGATGTTC
|
||||||
|
TTTACCAACCACCACAAACCTCTATCACCTCAGCTGTTTTGCAGAGTGGTTTTAGAAAAATGGCATTCCC
|
||||||
|
ATCTGGTAAAGTTGAGGGTTGTATGGTACAAGTAACTTGTGGTACAACTACACTTAACGGTCTTTGGCTT
|
||||||
|
GATGACGTAGTTTACTGTCCAAGACATGTGATCTGCACCTCTGAAGACATGCTTAACCCTAATTATGAAG
|
||||||
|
ATTTACTCATTCGTAAGTCTAATCATAATTTCTTGGTACAGGCTGGTAATGTTCAACTCAGGGTTATTGG
|
||||||
|
ACATTCTATGCAAAATTGTGTACTTAAGCTTAAGGTTGATACAGCCAATCCTAAGACACCTAAGTATAAG
|
||||||
|
TTTGTTCGCATTCAACCAGGACAGACTTTTTCAGTGTTAGCTTGTTACAATGGTTCACCATCTGGTGTTT
|
||||||
|
ACCAATGTGCTATGAGGCCCAATTTCACTATTAAGGGTTCATTCCTTAATGGTTCATGTGGTAGTGTTGG
|
||||||
|
TTTTAACATAGATTATGACTGTGTCTCTTTTTGTTACATGCACCATATGGAATTACCAACTGGAGTTCAT
|
||||||
|
GCTGGCACAGACTTAGAAGGTAACTTTTATGGACCTTTTGTTGACAGGCAAACAGCACAAGCAGCTGGTA
|
||||||
|
CGGACACAACTATTACAGTTAATGTTTTAGCTTGGTTGTACGCTGCTGTTATAAATGGAGACAGGTGGTT
|
||||||
|
TCTCAATCGATTTACCACAACTCTTAATGACTTTAACCTTGTGGCTATGAAGTACAATTATGAACCTCTA
|
||||||
|
ACACAAGACCATGTTGACATACTAGGACCTCTTTCTGCTCAAACTGGAATTGCCGTTTTAGATATGTGTG
|
||||||
|
CTTCATTAAAAGAATTACTGCAAAATGGTATGAATGGACGTACCATATTGGGTAGTGCTTTATTAGAAGA
|
||||||
|
TGAATTTACACCTTTTGATGTTGTTAGACAATGCTCAGGTGTTACTTTCCAAAGTGCAGTGAAAAGAACA
|
||||||
|
ATCAAGGGTACACACCACTGGTTGTTACTCACAATTTTGACTTCACTTTTAGTTTTAGTCCAGAGTACTC
|
||||||
|
AATGGTCTTTGTTCTTTTTTTTGTATGAAAATGCCTTTTTACCTTTTGCTATGGGTATTATTGCTATGTC
|
||||||
|
TGCTTTTGCAATGATGTTTGTCAAACATAAGCATGCATTTCTCTGTTTGTTTTTGTTACCTTCTCTTGCC
|
||||||
|
ACTGTAGCTTATTTTAATATGGTCTATATGCCTGCTAGTTGGGTGATGCGTATTATGACATGGTTGGATA
|
||||||
|
TGGTTGATACTAGTTTGTCTGGTTTTAAGCTAAAAGACTGTGTTATGTATGCATCAGCTGTAGTGTTACT
|
||||||
|
AATCCTTATGACAGCAAGAACTGTGTATGATGATGGTGCTAGGAGAGTGTGGACACTTATGAATGTCTTG
|
||||||
|
ACACTCGTTTATAAAGTTTATTATGGTAATGCTTTAGATCAAGCCATTTCCATGTGGGCTCTTATAATCT
|
||||||
|
CTGTTACTTCTAACTACTCAGGTGTAGTTACAACTGTCATGTTTTTGGCCAGAGGTATTGTTTTTATGTG
|
||||||
|
TGTTGAGTATTGCCCTATTTTCTTCATAACTGGTAATACACTTCAGTGTATAATGCTAGTTTATTGTTTC
|
||||||
|
TTAGGCTATTTTTGTACTTGTTACTTTGGCCTCTTTTGTTTACTCAACCGCTACTTTAGACTGACTCTTG
|
||||||
|
GTGTTTATGATTACTTAGTTTCTACACAGGAGTTTAGATATATGAATTCACAGGGACTACTCCCACCCAA
|
||||||
|
GAATAGCATAGATGCCTTCAAACTCAACATTAAATTGTTGGGTGTTGGTGGCAAACCTTGTATCAAAGTA
|
||||||
|
GCCACTGTACAGTCTAAAATGTCAGATGTAAAGTGCACATCAGTAGTCTTACTCTCAGTTTTGCAACAAC
|
||||||
|
TCAGAGTAGAATCATCATCTAAATTGTGGGCTCAATGTGTCCAGTTACACAATGACATTCTCTTAGCTAA
|
||||||
|
AGATACTACTGAAGCCTTTGAAAAAATGGTTTCACTACTTTCTGTTTTGCTTTCCATGCAGGGTGCTGTA
|
||||||
|
GACATAAACAAGCTTTGTGAAGAAATGCTGGACAACAGGGCAACCTTACAAGCTATAGCCTCAGAGTTTA
|
||||||
|
GTTCCCTTCCATCATATGCAGCTTTTGCTACTGCTCAAGAAGCTTATGAGCAGGCTGTTGCTAATGGTGA
|
||||||
|
TTCTGAAGTTGTTCTTAAAAAGTTGAAGAAGTCTTTGAATGTGGCTAAATCTGAATTTGACCGTGATGCA
|
||||||
|
GCCATGCAACGTAAGTTGGAAAAGATGGCTGATCAAGCTATGACCCAAATGTATAAACAGGCTAGATCTG
|
||||||
|
AGGACAAGAGGGCAAAAGTTACTAGTGCTATGCAGACAATGCTTTTCACTATGCTTAGAAAGTTGGATAA
|
||||||
|
TGATGCACTCAACAACATTATCAACAATGCAAGAGATGGTTGTGTTCCCTTGAACATAATACCTCTTACA
|
||||||
|
ACAGCAGCCAAACTAATGGTTGTCATACCAGACTATAACACATATAAAAATACGTGTGATGGTACAACAT
|
||||||
|
TTACTTATGCATCAGCATTGTGGGAAATCCAACAGGTTGTAGATGCAGATAGTAAAATTGTTCAACTTAG
|
||||||
|
TGAAATTAGTATGGACAATTCACCTAATTTAGCATGGCCTCTTATTGTAACAGCTTTAAGGGCCAATTCT
|
||||||
|
GCTGTCAAATTACAGAATAATGAGCTTAGTCCTGTTGCACTACGACAGATGTCTTGTGCTGCCGGTACTA
|
||||||
|
CACAAACTGCTTGCACTGATGACAATGCGTTAGCTTACTACAACACAACAAAGGGAGGTAGGTTTGTACT
|
||||||
|
TGCACTGTTATCCGATTTACAGGATTTGAAATGGGCTAGATTCCCTAAGAGTGATGGAACTGGTACTATC
|
||||||
|
TATACAGAACTGGAACCACCTTGTAGGTTTGTTACAGACACACCTAAAGGTCCTAAAGTGAAGTATTTAT
|
||||||
|
ACTTTATTAAAGGATTAAACAACCTAAATAGAGGTATGGTACTTGGTAGTTTAGCTGCCACAGTACGTCT
|
||||||
|
ACAAGCTGGTAATGCAACAGAAGTGCCTGCCAATTCAACTGTATTATCTTTCTGTGCTTTTGCTGTAGAT
|
||||||
|
GCTGCTAAAGCTTACAAAGATTATCTAGCTAGTGGGGGACAACCAATCACTAATTGTGTTAAGATGTTGT
|
||||||
|
GTACACACACTGGTACTGGTCAGGCAATAACAGTTACACCGGAAGCCAATATGGATCAAGAATCCTTTGG
|
||||||
|
TGGTGCATCGTGTTGTCTGTACTGCCGTTGCCACATAGATCATCCAAATCCTAAAGGATTTTGTGACTTA
|
||||||
|
AAAGGTAAGTATGTACAAATACCTACAACTTGTGCTAATGACCCTGTGGGTTTTACACTTAAAAACACAG
|
||||||
|
TCTGTACCGTCTGCGGTATGTGGAAAGGTTATGGCTGTAGTTGTGATCAACTCCGCGAACCCATGCTTCA
|
||||||
|
GTCAGCTGATGCACAATCGTTTTTAAACGGGTTTGCGGTGTAAGTGCAGCCCGTCTTACACCGTGCGGCA
|
||||||
|
CAGGCACTAGTACTGATGTCGTATACAGGGCTTTTGACATCTACAATGATAAAGTAGCTGGTTTTGCTAA
|
||||||
|
ATTCCTAAAAACTAATTGTTGTCGCTTCCAAGAAAAGGACGAAGATGACAATTTAATTGATTCTTACTTT
|
||||||
|
GTAGTTAAGAGACACACTTTCTCTAACTACCAACATGAAGAAACAATTTATAATTTACTTAAGGATTGTC
|
||||||
|
CAGCTGTTGCTAAACATGACTTCTTTAAGTTTAGAATAGACGGTGACATGGTACCACATATATCACGTCA
|
||||||
|
ACGTCTTACTAAATACACAATGGCAGACCTCGTCTATGCTTTAAGGCATTTTGATGAAGGTAATTGTGAC
|
||||||
|
ACATTAAAAGAAATACTTGTCACATACAATTGTTGTGATGATGATTATTTCAATAAAAAGGACTGGTATG
|
||||||
|
ATTTTGTAGAAAACCCAGATATATTACGCGTATACGCCAACTTAGGTGAACGTGTACGCCAAGCTTTGTT
|
||||||
|
AAAAACAGTACAATTCTGTGATGCCATGCGAAATGCTGGTATTGTTGGTGTACTGACATTAGATAATCAA
|
||||||
|
GATCTCAATGGTAACTGGTATGATTTCGGTGATTTCATACAAACCACGCCAGGTAGTGGAGTTCCTGTTG
|
||||||
|
TAGATTCTTATTATTCATTGTTAATGCCTATATTAACCTTGACCAGGGCTTTAACTGCAGAGTCACATGT
|
||||||
|
TGACACTGACTTAACAAAGCCTTACATTAAGTGGGATTTGTTAAAATATGACTTCACGGAAGAGAGGTTA
|
||||||
|
AAACTCTTTGACCGTTATTTTAAATATTGGGATCAGACATACCACCCAAATTGTGTTAACTGTTTGGATG
|
||||||
|
ACAGATGCATTCTGCATTGTGCAAACTTTAATGTTTTATTCTCTACAGTGTTCCCACCTACAAGTTTTGG
|
||||||
|
ACCACTAGTGAGAAAAATATTTGTTGATGGTGTTCCATTTGTAGTTTCAACTGGATACCACTTCAGAGAG
|
||||||
|
CTAGGTGTTGTACATAATCAGGATGTAAACTTACATAGCTCTAGACTTAGTTTTAAGGAATTACTTGTGT
|
||||||
|
ATGCTGCTGACCCTGCTATGCACGCTGCTTCTGGTAATCTATTACTAGATAAACGCACTACGTGCTTTTC
|
||||||
|
AGTAGCTGCACTTACTAACAATGTTGCTTTTCAAACTGTCAAACCCGGTAATTTTAACAAAGACTTCTAT
|
||||||
|
GACTTTGCTGTGTCTAAGGGTTTCTTTAAGGAAGGAAGTTCTGTTGAATTAAAACACTTCTTCTTTGCTC
|
||||||
|
AGGATGGTAATGCTGCTATCAGCGATTATGACTACTATCGTTATAATCTACCAACAATGTGTGATATCAG
|
||||||
|
ACAACTACTATTTGTAGTTGAAGTTGTTGATAAGTACTTTGATTGTTACGATGGTGGCTGTATTAATGCT
|
||||||
|
AACCAAGTCATCGTCAACAACCTAGACAAATCAGCTGGTTTTCCATTTAATAAATGGGGTAAGGCTAGAC
|
||||||
|
TTTATTATGATTCAATGAGTTATGAGGATCAAGATGCACTTTTCGCATATACAAAACGTAATGTCATCCC
|
||||||
|
TACTATAACTCAAATGAATCTTAAGTATGCCATTAGTGCAAAGAATAGAGCTCGCACCGTAGCTGGTGTC
|
||||||
|
TCTATCTGTAGTACTATGACCAATAGACAGTTTCATCAAAAATTATTGAAATCAATAGCCGCCACTAGAG
|
||||||
|
GAGCTACTGTAGTAATTGGAACAAGCAAATTCTATGGTGGTTGGCACAACATGTTAAAAACTGTTTATAG
|
||||||
|
TGATGTAGAAAACCCTCACCTTATGGGTTGGGATTATCCTAAATGTGATAGAGCCATGCCTAACATGCTT
|
||||||
|
AGAATTATGGCCTCACTTGTTCTTGCTCGCAAACATACAACGTGTTGTAGCTTGTCACACCGTTTCTATA
|
||||||
|
GATTAGCTAATGAGTGTGCTCAAGTATTGAGTGAAATGGTCATGTGTGGCGGTTCACTATATGTTAAACC
|
||||||
|
AGGTGGAACCTCATCAGGAGATGCCACAACTGCTTATGCTAATAGTGTTTTTAACATTTGTCAAGCTGTC
|
||||||
|
ACGGCCAATGTTAATGCACTTTTATCTACTGATGGTAACAAAATTGCCGATAAGTATGTCCGCAATTTAC
|
||||||
|
AACACAGACTTTATGAGTGTCTCTATAGAAATAGAGATGTTGACACAGACTTTGTGAATGAGTTTTACGC
|
||||||
|
ATATTTGCGTAAACATTTCTCAATGATGATACTCTCTGACGATGCTGTTGTGTGTTTCAATAGCACTTAT
|
||||||
|
GCATCTCAAGGTCTAGTGGCTAGCATAAAGAACTTTAAGTCAGTTCTTTATTATCAAAACAATGTTTTTA
|
||||||
|
TGTCTGAAGCAAAATGTTGGACTGAGACTGACCTTACTAAAGGACCTCATGAATTTTGCTCTCAACATAC
|
||||||
|
AATGCTAGTTAAACAGGGTGATGATTATGTGTACCTTCCTTACCCAGATCCATCAAGAATCCTAGGGGCC
|
||||||
|
GGCTGTTTTGTAGATGATATCGTAAAAACAGATGGTACACTTATGATTGAACGGTTCGTGTCTTTAGCTA
|
||||||
|
TAGATGCTTACCCACTTACTAAACATCCTAATCAGGAGTATGCTGATGTCTTTCATTTGTACTTACAATA
|
||||||
|
CATAAGAAAGCTACATGATGAGTTAACAGGACACATGTTAGACATGTATTCTGTTATGCTTACTAATGAT
|
||||||
|
AACACTTCAAGGTATTGGGAACCTGAGTTTTATGAGGCTATGTACACACCGCATACAGTCTTACAGGCTG
|
||||||
|
TTGGGGCTTGTGTTCTTTGCAATTCACAGACTTCATTAAGATGTGGTGCTTGCATACGTAGACCATTCTT
|
||||||
|
ATGTTGTAAATGCTGTTACGACCATGTCATATCAACATCACATAAATTAGTCTTGTCTGTTAATCCGTAT
|
||||||
|
GTTTGCAATGCTCCAGGTTGTGATGTCACAGATGTGACTCAACTTTACTTAGGAGGTATGAGCTATTATT
|
||||||
|
GTAAATCACATAAACCACCCATTAGTTTTCCATTGTGTGCTAATGGACAAGTTTTTGGTTTATATAAAAA
|
||||||
|
TACATGTGTTGGTAGCGATAATGTTACTGACTTTAATGCAATTGCAACATGTGACTGGACAAATGCTGGT
|
||||||
|
GATTACATTTTAGCTAACACCTGTACTGAAAGACTCAAGCTTTTTGCAGCAGAAACGCTCAAAGCTACTG
|
||||||
|
AGGAGACATTTAAACTGTCTTATGGTATTGCTACTGTACGTGAAGTGCTGTCTGACAGAGAATTACATCT
|
||||||
|
TTCATGGGAAGTTGGTAAACCTAGACCACCACTTAACCGAAATTATGTCTTTACTGGTTATCGTGTAACT
|
||||||
|
AAAAACAGTAAAGTACAAATAGGAGAGTACACCTTTGAAAAAGGTGACTATGGTGATGCTGTTGTTTACC
|
||||||
|
GAGGTACAACAACTTACAAATTAAATGTTGGTGATTATTTTGTGCTGACATCACATACAGTAATGCCATT
|
||||||
|
AAGTGCACCTACACTAGTGCCACAAGAGCACTATGTTAGAATTACTGGCTTATACCCAACACTCAATATC
|
||||||
|
TCAGATGAGTTTTCTAGCAATGTTGCAAATTATCAAAAGGTTGGTATGCAAAAGTATTCTACACTCCAGG
|
||||||
|
GACCACCTGGTACTGGTAAGAGTCATTTTGCTATTGGCCTAGCTCTCTACTACCCTTCTGCTCGCATAGT
|
||||||
|
GTATACAGCTTGCTCTCATGCCGCTGTTGATGCACTATGTGAGAAGGCATTAAAATATTTGCCTATAGAT
|
||||||
|
AAATGTAGTAGAATTATACCTGCACGTGCTCGTGTAGAGTGTTTTGATAAATTCAAAGTGAATTCAACAT
|
||||||
|
TAGAACAGTATGTCTTTTGTACTGTAAATGCATTGCCTGAGACGACAGCAGATATAGTTGTCTTTGATGA
|
||||||
|
AATTTCAATGGCCACAAATTATGATTTGAGTGTTGTCAATGCCAGATTACGTGCTAAGCACTATGTGTAC
|
||||||
|
ATTGGCGACCCTGCTCAATTACCTGCACCACGCACATTGCTAACTAAGGGCACACTAGAACCAGAATATT
|
||||||
|
TCAATTCAGTGTGTAGACTTATGAAAACTATAGGTCCAGACATGTTCCTCGGAACTTGTCGGCGTTGTCC
|
||||||
|
TGCTGAAATTGTTGACACTGTGAGTGCTTTGGTTTATGATAATAAGCTTAAAGCACATAAAGACAAATCA
|
||||||
|
GCTCAATGCTTTAAAATGTTTTATAAGGGTGTTATCACGCATGATGTTTCATCTGCAATTAACAGGCCAC
|
||||||
|
AAATAGGCGTGGTAAGAGAATTCCTTACACGTAACCCTGCTTGGAGAAAAGCTGTCTTTATTTCACCTTA
|
||||||
|
TAATTCACAGAATGCTGTAGCCTCAAAGATTTTGGGACTACCAACTCAAACTGTTGATTCATCACAGGGC
|
||||||
|
TCAGAATATGACTATGTCATATTCACTCAAACCACTGAAACAGCTCACTCTTGTAATGTAAACAGATTTA
|
||||||
|
ATGTTGCTATTACCAGAGCAAAAGTAGGCATACTTTGCATAATGTCTGATAGAGACCTTTATGACAAGTT
|
||||||
|
GCAATTTACAAGTCTTGAAATTCCACGTAGGAATGTGGCAACTTTACAAGCTGAAAATGTAACAGGACTC
|
||||||
|
TTTAAAGATTGTAGTAAGGTAATCACTGGGTTACATCCTACACAGGCACCTACACACCTCAGTGTTGACA
|
||||||
|
CTAAATTCAAAACTGAAGGTTTATGTGTTGACATACCTGGCATACCTAAGGACATGACCTATAGAAGACT
|
||||||
|
CATCTCTATGATGGGTTTTAAAATGAATTATCAAGTTAATGGTTACCCTAACATGTTTATCACCCGCGAA
|
||||||
|
GAAGCTATAAGACATGTACGTGCATGGATTGGCTTCGATGTCGAGGGGTGTCATGCTACTAGAGAAGCTG
|
||||||
|
TTGGTACCAATTTACCTTTACAGCTAGGTTTTTCTACAGGTGTTAACCTAGTTGCTGTACCTACAGGTTA
|
||||||
|
TGTTGATACACCTAATAATACAGATTTTTCCAGAGTTAGTGCTAAACCACCGCCTGGAGATCAATTTAAA
|
||||||
|
CACCTCATACCACTTATGTACAAAGGACTTCCTTGGAATGTAGTGCGTATAAAGATTGTACAAATGTTAA
|
||||||
|
GTGACACACTTAAAAATCTCTCTGACAGAGTCGTATTTGTCTTATGGGCACATGGCTTTGAGTTGACATC
|
||||||
|
TATGAAGTATTTTGTGAAAATAGGACCTGAGCGCACCTGTTGTCTATGTGATAGACGTGCCACATGCTTT
|
||||||
|
TCCACTGCTTCAGACACTTATGCCTGTTGGCATCATTCTATTGGATTTGATTACGTCTATAATCCGTTTA
|
||||||
|
TGATTGATGTTCAACAATGGGGTTTTACAGGTAACCTACAAAGCAACCATGATCTGTATTGTCAAGTCCA
|
||||||
|
TGGTAATGCACATGTAGCTAGTTGTGATGCAATCATGACTAGGTGTCTAGCTGTCCACGAGTGCTTTGTT
|
||||||
|
AAGCGTGTTGACTGGACTATTGAATATCCTATAATTGGTGATGAACTGAAGATTAATGCGGCTTGTAGAA
|
||||||
|
AGGTTCAACACATGGTTGTTAAAGCTGCATTATTAGCAGACAAATTCCCAGTTCTTCACGACATTGGTAA
|
||||||
|
CCCTAAAGCTATTAAGTGTGTACCTCAAGCTGATGTAGAATGGAAGTTCTATGATGCACAGCCTTGTAGT
|
||||||
|
GACAAAGCTTATAAAATAGAAGAATTATTCTATTCTTATGCCACACATTCTGACAAATTCACAGATGGTG
|
||||||
|
TATGCCTATTTTGGAATTGCAATGTCGATAGATATCCTGCTAATTCCATTGTTTGTAGATTTGACACTAG
|
||||||
|
AGTGCTATCTAACCTTAACTTGCCTGGTTGTGATGGTGGCAGTTTGTATGTAAATAAACATGCATTCCAC
|
||||||
|
ACACCAGCTTTTGATAAAAGTGCTTTTGTTAATTTAAAACAATTACCATTTTTCTATTACTCTGACAGTC
|
||||||
|
CATGTGAGTCTCATGGAAAACAAGTAGTGTCAGATATAGATTATGTACCACTAAAGTCTGCTACGTGTAT
|
||||||
|
AACACGTTGCAATTTAGGTGGTGCTGTCTGTAGACATCATGCTAATGAGTACAGATTGTATCTCGATGCT
|
||||||
|
TATAACATGATGATCTCAGCTGGCTTTAGCTTGTGGGTTTACAAACAATTTGATACTTATAACCTCTGGA
|
||||||
|
ACACTTTTACAAGACTTCAGAGTTTAGAAAATGTGGCTTTTAATGTTGTAAATAAGGGACACTTTGATGG
|
||||||
|
ACAACAGGGTGAAGTACCAGTTTCTATCATTAATAACACTGTTTACACAAAAGTTGATGGTGTTGATGTA
|
||||||
|
GAATTGTTTGAAAATAAAACAACATTACCTGTTAATGTAGCATTTGAGCTTTGGGCTAAGCGCAACATTA
|
||||||
|
AACCAGTACCAGAGGTGAAAATACTCAATAATTTGGGTGTGGACATTGCTGCTAATACTGTGATCTGGGA
|
||||||
|
CTACAAAAGAGATGCTCCAGCACATATATCTACTATTGGTGTTTGTTCTATGACTGACATAGCCAAGAAA
|
||||||
|
CCAACTGAAACGATTTGTGCACCACTCACTGTCTTTTTTGATGGTAGAGTTGATGGTCAAGTAGACTTAT
|
||||||
|
TTAGAAATGCCCGTAATGGTGTTCTTATTACAGAAGGTAGTGTTAAAGGTTTACAACCATCTGTAGGTCC
|
||||||
|
CAAACAAGCTAGTCTTAATGGAGTCACATTAATTGGAGAAGCCGTAAAAACACAGTTCAATTATTATAAG
|
||||||
|
AAAGTTGATGGTGTTGTCCAACAATTACCTGAAACTTACTTTACTCAGAGTAGAAATTTACAAGAATTTA
|
||||||
|
AACCCAGGAGTCAAATGGAAATTGATTTCTTAGAATTAGCTATGGATGAATTCATTGAACGGTATAAATT
|
||||||
|
AGAAGGCTATGCCTTCGAACATATCGTTTATGGAGATTTTAGTCATAGTCAGTTAGGTGGTTTACATCTA
|
||||||
|
CTGATTGGACTAGCTAAACGTTTTAAGGAATCACCTTTTGAATTAGAAGATTTTATTCCTATGGACAGTA
|
||||||
|
CAGTTAAAAACTATTTCATAACAGATGCGCAAACAGGTTCATCTAAGTGTGTGTGTTCTGTTATTGATTT
|
||||||
|
ATTACTTGATGATTTTGTTGAAATAATAAAATCCCAAGATTTATCTGTAGTTTCTAAGGTTGTCAAAGTG
|
||||||
|
ACTATTGACTATACAGAAATTTCATTTATGCTTTGGTGTAAAGATGGCCATGTAGAAACATTTTACCCAA
|
||||||
|
AATTACAATCTAGTCAAGCGTGGCAACCGGGTGTTGCTATGCCTAATCTTTACAAAATGCAAAGAATGCT
|
||||||
|
ATTAGAAAAGTGTGACCTTCAAAATTATGGTGATAGTGCAACATTACCTAAAGGCATAATGATGAATGTC
|
||||||
|
GCAAAATATACTCAACTGTGTCAATATTTAAACACATTAACATTAGCTGTACCCTATAATATGAGAGTTA
|
||||||
|
TACATTTTGGTGCTGGTTCTGATAAAGGAGTTGCACCAGGTACAGCTGTTTTAAGACAGTGGTTGCCTAC
|
||||||
|
GGGTACGCTGCTTGTCGATTCAGATCTTAATGACTTTGTCTCTGATGCAGATTCAACTTTGATTGGTGAT
|
||||||
|
TGTGCAACTGTACATACAGCTAATAAATGGGATCTCATTATTAGTGATATGTACGACCCTAAGACTAAAA
|
||||||
|
ATGTTACAAAAGAAAATGACTCTAAAGAGGGTTTTTTCACTTACATTTGTGGGTTTATACAACAAAAGCT
|
||||||
|
AGCTCTTGGAGGTTCCGTGGCTATAAAGATAACAGAACATTCTTGGAATGCTGATCTTTATAAGCTCATG
|
||||||
|
GGACACTTCGCATGGTGGACAGCCTTTGTTACTAATGTGAATGCGTCATCATCTGAAGCATTTTTAATTG
|
||||||
|
GATGTAATTATCTTGGCAAACCACGCGAACAAATAGATGGTTATGTCATGCATGCAAATTACATATTTTG
|
||||||
|
GAGGAATACAAATCCAATTCAGTTGTCTTCCTATTCTTTATTTGACATGAGTAAATTTCCCCTTAAATTA
|
||||||
|
AGGGGTACTGCTGTTATGTCTTTAAAAGAAGGTCAAATCAATGATATGATTTTATCTCTTCTTAGTAAAG
|
||||||
|
GTAGACTTATAATTAGAGAAAACAACAGAGTTGTTATTTCTAGTGATGTTCTTGTTAACAACTAAACGAA
|
||||||
|
CAATGTTTGTTTTTCTTGTTTTATTGCCACTAGTCTCTAGTCAGTGTGTTAATCTTACAACCAGAACTCA
|
||||||
|
ATTACCCCCTGCATACACTAATTCTTTCACACGTGGTGTTTATTACCCTGACAAAGTTTTCAGATCCTCA
|
||||||
|
GTTTTACATTCAACTCAGGACTTGTTCTTACCTTTCTTTTCCAATGTTACTTGGTTCCATGCTATACATG
|
||||||
|
TCTCTGGGACCAATGGTACTAAGAGGTTTGATAACCCTGTCCTACCATTTAATGATGGTGTTTATTTTGC
|
||||||
|
TTCCACTGAGAAGTCTAACATAATAAGAGGCTGGATTTTTGGTACTACTTTAGATTCGAAGACCCAGTCC
|
||||||
|
CTACTTATTGTTAATAACGCTACTAATGTTGTTATTAAAGTCTGTGAATTTCAATTTTGTAATGATCCAT
|
||||||
|
TTTTGGGTGTTTATTACCACAAAAACAACAAAAGTTGGATGGAAAGTGAGTTCAGAGTTTATTCTAGTGC
|
||||||
|
GAATAATTGCACTTTTGAATATGTCTCTCAGCCTTTTCTTATGGACCTTGAAGGAAAACAGGGTAATTTC
|
||||||
|
AAAAATCTTAGGGAATTTGTGTTTAAGAATATTGATGGTTATTTTAAAATATATTCTAAGCACACGCCTA
|
||||||
|
TTAATTTAGTGCGTGATCTCCCTCAGGGTTTTTCGGCTTTAGAACCATTGGTAGATTTGCCAATAGGTAT
|
||||||
|
TAACATCACTAGGTTTCAAACTTTACTTGCTTTACATAGAAGTTATTTGACTCCTGGTGATTCTTCTTCA
|
||||||
|
GGTTGGACAGCTGGTGCTGCAGCTTATTATGTGGGTTATCTTCAACCTAGGACTTTTCTATTAAAATATA
|
||||||
|
ATGAAAATGGAACCATTACAGATGCTGTAGACTGTGCACTTGACCCTCTCTCAGAAACAAAGTGTACGTT
|
||||||
|
GAAATCCTTCACTGTAGAAAAAGGAATCTATCAAACTTCTAACTTTAGAGTCCAACCAACAGAATCTATT
|
||||||
|
GTTAGATTTCCTAATATTACAAACTTGTGCCCTTTTGGTGAAGTTTTTAACGCCACCAGATTTGCATCTG
|
||||||
|
TTTATGCTTGGAACAGGAAGAGAATCAGCAACTGTGTTGCTGATTATTCTGTCCTATATAATTCCGCATC
|
||||||
|
ATTTTCCACTTTTAAGTGTTATGGAGTGTCTCCTACTAAATTAAATGATCTCTGCTTTACTAATGTCTAT
|
||||||
|
GCAGATTCATTTGTAATTAGAGGTGATGAAGTCAGACAAATCGCTCCAGGGCAAACTGGAAAGATTGCTG
|
||||||
|
ATTATAATTATAAATTACCAGATGATTTTACAGGCTGCGTTATAGCTTGGAATTCTAACAATCTTGATTC
|
||||||
|
TAAGGTTGGTGGTAATTATAATTACCTGTATAGATTGTTTAGGAAGTCTAATCTCAAACCTTTTGAGAGA
|
||||||
|
GATATTTCAACTGAAATCTATCAGGCCGGTAGCACACCTTGTAATGGTGTTGAAGGTTTTAATTGTTACT
|
||||||
|
TTCCTTTACAATCATATGGTTTCCAACCCACTAATGGTGTTGGTTACCAACCATACAGAGTAGTAGTACT
|
||||||
|
TTCTTTTGAACTTCTACATGCACCAGCAACTGTTTGTGGACCTAAAAAGTCTACTAATTTGGTTAAAAAC
|
||||||
|
AAATGTGTCAATTTCAACTTCAATGGTTTAACAGGCACAGGTGTTCTTACTGAGTCTAACAAAAAGTTTC
|
||||||
|
TGCCTTTCCAACAATTTGGCAGAGACATTGCTGACACTACTGATGCTGTCCGTGATCCACAGACACTTGA
|
||||||
|
GATTCTTGACATTACACCATGTTCTTTTGGTGGTGTCAGTGTTATAACACCAGGAACAAATACTTCTAAC
|
||||||
|
CAGGTTGCTGTTCTTTATCAGGATGTTAACTGCACAGAAGTCCCTGTTGCTATTCATGCAGATCAACTTA
|
||||||
|
CTCCTACTTGGCGTGTTTATTCTACAGGTTCTAATGTTTTTCAAACACGTGCAGGCTGTTTAATAGGGGC
|
||||||
|
TGAACATGTCAACAACTCATATGAGTGTGACATACCCATTGGTGCAGGTATATGCGCTAGTTATCAGACT
|
||||||
|
CAGACTAATTCTCCTCGGCGGGCACGTAGTGTAGCTAGTCAATCCATCATTGCCTACACTATGTCACTTG
|
||||||
|
GTGCAGAAAATTCAGTTGCTTACTCTAATAACTCTATTGCCATACCCACAAATTTTACTATTAGTGTTAC
|
||||||
|
CACAGAAATTCTACCAGTGTCTATGACCAAGACATCAGTAGATTGTACAATGTACATTTGTGGTGATTCA
|
||||||
|
ACTGAATGCAGCAATCTTTTGTTGCAATATGGCAGTTTTTGTACACAATTAAACCGTGCTTTAACTGGAA
|
||||||
|
TAGCTGTTGAACAAGACAAAAACACCCAAGAAGTTTTTGCACAAGTCAAACAAATTTACAAAACACCACC
|
||||||
|
AATTAAAGATTTTGGTGGTTTTAATTTTTCACAAATATTACCAGATCCATCAAAACCAAGCAAGAGGTCA
|
||||||
|
TTTATTGAAGATCTACTTTTCAACAAAGTGACACTTGCAGATGCTGGCTTCATCAAACAATATGGTGATT
|
||||||
|
GCCTTGGTGATATTGCTGCTAGAGACCTCATTTGTGCACAAAAGTTTAACGGCCTTACTGTTTTGCCACC
|
||||||
|
TTTGCTCACAGATGAAATGATTGCTCAATACACTTCTGCACTGTTAGCGGGTACAATCACTTCTGGTTGG
|
||||||
|
ACCTTTGGTGCAGGTGCTGCATTACAAATACCATTTGCTATGCAAATGGCTTATAGGTTTAATGGTATTG
|
||||||
|
GAGTTACACAGAATGTTCTCTATGAGAACCAAAAATTGATTGCCAACCAATTTAATAGTGCTATTGGCAA
|
||||||
|
AATTCAAGACTCACTTTCTTCCACAGCAAGTGCACTTGGAAAACTTCAAGATGTGGTCAACCAAAATGCA
|
||||||
|
CAAGCTTTAAACACGCTTGTTAAACAACTTAGCTCCAATTTTGGTGCAATTTCAAGTGTTTTAAATGATA
|
||||||
|
TCCTTTCACGTCTTGACAAAGTTGAGGCTGAAGTGCAAATTGATAGGTTGATCACAGGCAGACTTCAAAG
|
||||||
|
TTTGCAGACATATGTGACTCAACAATTAATTAGAGCTGCAGAAATCAGAGCTTCTGCTAATCTTGCTGCT
|
||||||
|
ACTAAAATGTCAGAGTGTGTACTTGGACAATCAAAAAGAGTTGATTTTTGTGGAAAGGGCTATCATCTTA
|
||||||
|
TGTCCTTCCCTCAGTCAGCACCTCATGGTGTAGTCTTCTTGCATGTGACTTATGTCCCTGCACAAGAAAA
|
||||||
|
GAACTTCACAACTGCTCCTGCCATTTGTCATGATGGAAAAGCACACTTTCCTCGTGAAGGTGTCTTTGTT
|
||||||
|
TCAAATGGCACACACTGGTTTGTAACACAAAGGAATTTTTATGAACCACAAATCATTACTACAGACAACA
|
||||||
|
CATTTGTGTCTGGTAACTGTGATGTTGTAATAGGAATTGTCAACAACACAGTTTATGATCCTTTGCAACC
|
||||||
|
TGAATTAGACTCATTCAAGGAGGAGTTAGATAAATATTTTAAGAATCATACATCACCAGATGTTGATTTA
|
||||||
|
GGTGACATCTCTGGCATTAATGCTTCAGTTGTAAACATTCAAAAAGAAATTGACCGCCTCAATGAGGTTG
|
||||||
|
CCAAGAATTTAAATGAATCTCTCATCGATCTCCAAGAACTTGGAAAGTATGAGCAGTATATAAAATGGCC
|
||||||
|
ATGGTACATTTGGCTAGGTTTTATAGCTGGCTTGATTGCCATAGTAATGGTGACAATTATGCTTTGCTGT
|
||||||
|
ATGACCAGTTGCTGTAGTTGTCTCAAGGGCTGTTGTTCTTGTGGATCCTGCTGCAAATTTGATGAAGACG
|
||||||
|
ACTCTGAGCCAGTGCTCAAAGGAGTCAAATTACATTACACATAAACGAACTTATGGATTTGTTTATGAGA
|
||||||
|
ATCTTCACAATTGGAACTGTAACTTTGAAGCAAGGTGAAATCAAGGATGCTACTCCTTCAGATTTTGTTC
|
||||||
|
GCGCTACTGCAACGATACCGATACAAGCCTCACTCCCTTTCGGATGGCTTATTGTTGGCGTTGCACTTCT
|
||||||
|
TGCTGTTTTTCAGAGCGCTTCCAAAATCATAACCCTCAAAAAGAGATGGCAACTAGCACTCTCCAAGGGT
|
||||||
|
GTTCACTTTGTTTGCAACTTGCTGTTGTTGTTTGTAACAGTTTACTCACACCTTTTGCTCGTTGCTGCTG
|
||||||
|
GCCTTGAAGCCCCTTTTCTCTATCTTTATGCTTTAGTCTACTTCTTGCAGAGTATAAACTTTGTAAGAAT
|
||||||
|
AATAATGAGGCTTTGGCTTTGCTGGAAATGCCGTTCCAAAAACCCATTACTTTATGATGCCAACTATTTT
|
||||||
|
CTTTGCTGGCATACTAATTGTTACGACTATTGTATACCTTACAATAGTGTAACTTCTTCAATTGTCATTA
|
||||||
|
CTTCAGGTGATGGCACAACAAGTCCTATTTCTGAACATGACTACCAGATTGGTGGTTATACTGAAAAATG
|
||||||
|
GGAATCTGGAGTAAAAGACTGTGTTGTATTACACAGTTACTTCACTTCAGACTATTACCAGCTGTACTCA
|
||||||
|
ACTCAATTGAGTACAGACACTGGTGTTGAACATGTTACCTTCTTCATCTACAATAAAATTGTTGATGAGC
|
||||||
|
CTGAAGAACATGTCCAAATTCACACAATCGACGGTTCATCCGGAGTTGTTAATCCAGTAATGGAACCAAT
|
||||||
|
TTATGATGAACCGACGACGACTACTAGCGTGCCTTTGTAAGCACAAGCTGATGAGTACGAACTTATGTAC
|
||||||
|
TCATTCGTTTCGGAAGAGACAGGTACGTTAATAGTTAATAGCGTACTTCTTTTTCTTGCTTTCGTGGTAT
|
||||||
|
TCTTGCTAGTTACACTAGCCATCCTTACTGCGCTTCGATTGTGTGCGTACTGCTGCAATATTGTTAACGT
|
||||||
|
GAGTCTTGTAAAACCTTCTTTTTACGTTTACTCTCGTGTTAAAAATCTGAATTCTTCTAGAGTTCCTGAT
|
||||||
|
CTTCTGGTCTAAACGAACTAAATATTATATTAGTTTTTCTGTTTGGAACTTTAATTTTAGCCATGGCAGA
|
||||||
|
TTCCAACGGTACTATTACCGTTGAAGAGCTTAAAAAGCTCCTTGAACAATGGAACCTAGTAATAGGTTTC
|
||||||
|
CTATTCCTTACATGGATTTGTCTTCTACAATTTGCCTATGCCAACAGGAATAGGTTTTTGTATATAATTA
|
||||||
|
AGTTAATTTTCCTCTGGCTGTTATGGCCAGTAACTTTAGCTTGTTTTGTGCTTGCTGCTGTTTACAGAAT
|
||||||
|
AAATTGGATCACCGGTGGAATTGCTATCGCAATGGCTTGTCTTGTAGGCTTGATGTGGCTCAGCTACTTC
|
||||||
|
ATTGCTTCTTTCAGACTGTTTGCGCGTACGCGTTCCATGTGGTCATTCAATCCAGAAACTAACATTCTTC
|
||||||
|
TCAACGTGCCACTCCATGGCACTATTCTGACCAGACCGCTTCTAGAAAGTGAACTCGTAATCGGAGCTGT
|
||||||
|
GATCCTTCGTGGACATCTTCGTATTGCTGGACACCATCTAGGACGCTGTGACATCAAGGACCTGCCTAAA
|
||||||
|
GAAATCACTGTTGCTACATCACGAACGCTTTCTTATTACAAATTGGGAGCTTCGCAGCGTGTAGCAGGTG
|
||||||
|
ACTCAGGTTTTGCTGCATACAGTCGCTACAGGATTGGCAACTATAAATTAAACACAGACCATTCCAGTAG
|
||||||
|
CAGTGACAATATTGCTTTGCTTGTACAGTAAGTGACAACAGATGTTTCATCTCGTTGACTTTCAGGTTAC
|
||||||
|
TATAGCAGAGATATTACTAATTATTATGAGGACTTTTAAAGTTTCCATTTGGAATCTTGATTACATCATA
|
||||||
|
AACCTCATAATTAAAAATTTATCTAAGTCACTAACTGAGAATAAATATTCTCAATTAGATGAAGAGCAAC
|
||||||
|
CAATGGAGATTGATTAAACGAACATGAAAATTATTCTTTTCTTGGCACTGATAACACTCGCTACTTGTGA
|
||||||
|
GCTTTATCACTACCAAGAGTGTGTTAGAGGTACAACAGTACTTTTAAAAGAACCTTGCTCTTCTGGAACA
|
||||||
|
TACGAGGGCAATTCACCATTTCATCCTCTAGCTGATAACAAATTTGCACTGACTTGCTTTAGCACTCAAT
|
||||||
|
TTGCTTTTGCTTGTCCTGACGGCGTAAAACACGTCTATCAGTTACGTGCCAGATCAGTTTCACCTAAACT
|
||||||
|
GTTCATCAGACAAGAGGAAGTTCAAGAACTTTACTCTCCAATTTTTCTTATTGTTGCGGCAATAGTGTTT
|
||||||
|
ATAACACTTTGCTTCACACTCAAAAGAAAGACAGAATGATTGAACTTTCATTAATTGACTTCTATTTGTG
|
||||||
|
CTTTTTAGCCTTTCTGCTATTCCTTGTTTTAATTATGCTTATTATCTTTTGGTTCTCACTTGAACTGCAA
|
||||||
|
GATCATAATGAAACTTGTCACGCCTAAACGAACATGAAATTTCTTGTTTTCTTAGGAATCATCACAACTG
|
||||||
|
TAGCTGCATTTCACCAAGAATGTAGTTTACAGTCATGTACTCAACATCAACCATATGTAGTTGATGACCC
|
||||||
|
GTGTCCTATTCACTTCTATTCTAAATGGTATATTAGAGTAGGAGCTAGAAAATCAGCACCTTTAATTGAA
|
||||||
|
TTGTGCGTGGATGAGGCTGGTTCTAAATCACCCATTCAGTACATCGATATCGGTAATTATACAGTTTCCT
|
||||||
|
GTTTACCTTTTACAATTAATTGCCAGGAACCTAAATTGGGTAGTCTTGTAGTGCGTTGTTCGTTCTATGA
|
||||||
|
AGACTTTTTAGAGTATCATGACGTTCGTGTTGTTTTAGATTTCATCTAAACGAACAAACTAAAATGTCTG
|
||||||
|
ATAATGGACCCCAAAATCAGCGAAATGCACCCCGCATTACGTTTGGTGGACCCTCAGATTCAACTGGCAG
|
||||||
|
TAACCAGAATGGAGAACGCAGTGGGGCGCGATCAAAACAACGTCGGCCCCAAGGTTTACCCAATAATACT
|
||||||
|
GCGTCTTGGTTCACCGCTCTCACTCAACATGGCAAGGAAGACCTTAAATTCCCTCGAGGACAAGGCGTTC
|
||||||
|
CAATTAACACCAATAGCAGTCCAGATGACCAAATTGGCTACTACCGAAGAGCTACCAGACGAATTCGTGG
|
||||||
|
TGGTGACGGTAAAATGAAAGATCTCAGTCCAAGATGGTATTTCTACTACCTAGGAACTGGGCCAGAAGCT
|
||||||
|
GGACTTCCCTATGGTGCTAACAAAGACGGCATCATATGGGTTGCAACTGAGGGAGCCTTGAATACACCAA
|
||||||
|
AAGATCACATTGGCACCCGCAATCCTGCTAACAATGCTGCAATCGTGCTACAACTTCCTCAAGGAACAAC
|
||||||
|
ATTGCCAAAAGGCTTCTACGCAGAAGGGAGCAGAGGCGGCAGTCAAGCCTCTTCTCGTTCCTCATCACGT
|
||||||
|
AGTCGCAACAGTTCAAGAAATTCAACTCCAGGCAGCAGTAGGGGAACTTCTCCTGCTAGAATGGCTGGCA
|
||||||
|
ATGGCGGTGATGCTGCTCTTGCTTTGCTGCTGCTTGACAGATTGAACCAGCTTGAGAGCAAAATGTCTGG
|
||||||
|
TAAAGGCCAACAACAACAAGGCCAAACTGTCACTAAGAAATCTGCTGCTGAGGCTTCTAAGAAGCCTCGG
|
||||||
|
CAAAAACGTACTGCCACTAAAGCATACAATGTAACACAAGCTTTCGGCAGACGTGGTCCAGAACAAACCC
|
||||||
|
AAGGAAATTTTGGGGACCAGGAACTAATCAGACAAGGAACTGATTACAAACATTGGCCGCAAATTGCACA
|
||||||
|
ATTTGCCCCCAGCGCTTCAGCGTTCTTCGGAATGTCGCGCATTGGCATGGAAGTCACACCTTCGGGAACG
|
||||||
|
TGGTTGACCTACACAGGTGCCATCAAATTGGATGACAAAGATCCAAATTTCAAAGATCAAGTCATTTTGC
|
||||||
|
TGAATAAGCATATTGACGCATACAAAACATTCCCACCAACAGAGCCTAAAAAGGACAAAAAGAAGAAGGC
|
||||||
|
TGATGAAACTCAAGCCTTACCGCAGAGACAGAAGAAACAGCAAACTGTGACTCTTCTTCCTGCTGCAGAT
|
||||||
|
TTGGATGATTTCTCCAAACAATTGCAACAATCCATGAGCAGTGCTGACTCAACTCAGGCCTAAACTCATG
|
||||||
|
CAGACCACACAAGGCAGATGGGCTATATAAACGTTTTCGCTTTTCCGTTTACGATATATAGTCTACTCTT
|
||||||
|
GTGCAGAATGAATTCTCGTAACTACATAGCACAAGTAGATGTAGTTAACTTTAATCTCACATAGCAATCT
|
||||||
|
TTAATCAGTGTGTAACATTAGGGAGGACTTGAAAGAGCCACCACATTTTCACCGAGGCCACGCGGAGTAC
|
||||||
|
GATCGAGTGTACAGTGAACAATGCTAGGGAGAGCTGCCTATATGGAAGAGCCCTAATGTGTAAAATTAAT
|
||||||
|
TTTAGTAGTGCTATCCCCATGTGATTTTAATAGCTTCTTAGGAGAATGACAAAAAAAAAAAAAAAAAAAA
|
||||||
|
AAAAAAAAAAAAA
|
||||||
|
|
8
tests/resources/SARS_CoV-2_genes.csv
Normal file
8
tests/resources/SARS_CoV-2_genes.csv
Normal file
@ -0,0 +1,8 @@
|
|||||||
|
id,sequence,start,end
|
||||||
|
ORF8,"ATGAAATTTCTTGTTTTCTTAGGAATCATCACAACTGTAGCTGCATTTCACCAAGAATGTAGTTTACAGT
|
||||||
|
CATGTACTCAACATCAACCATATGTAGTTGATGACCCGTGTCCTATTCACTTCTATTCTAAATGGTATAT
|
||||||
|
TAGAGTAGGAGCTAGAAAATCAGCACCTTTAATTGAATTGTGCGTGGATGAGGCTGGTTCTAAATCACCC
|
||||||
|
ATTCAGTACATCGATATCGGTAATTATACAGTTTCCTGTTTACCTTTTACAATTAATTGCCAGGAACCTA
|
||||||
|
AATTGGGTAGTCTTGTAGTGCGTTGTTCGTTCTATGAAGACTTTTTAGAGTATCATGACGTTCGTGTTGT
|
||||||
|
ATGAAATTTCTTGTTTTCTTAGGAATCATCACAACTGTAGCTGCATTTCACCAAGAATGTAGTTTACAGTCATGTACTCAACATCAACCATATGTAGTTGATGACCCGTGTCCTATTCACTTCTATTCTAAATGGTATATTAGAGTAGGAGCTAGAAAATCAGCACCTTTAATTGAATTGTGCGTGGATGAGGCTGGTTCTAAATCACCCATTCAGTACATCGATATCGGTAATTATACAGTTTCCTGTTTACCTTTTACAATTAATTGCCAGGAACCTAAATTGGGTAGTCTTGTAGTGCGTTGTTCGTTCTATGAAGACTTTTTAGAGTATCATGACGTTCGTGTTGTTTTAGATTTCATCTAA",27894,28259
|
||||||
|
ORF10,ATGGGCTATATAAACGTTTTCGCTTTTCCGTTTACGATATATAGTCTACTCTTGTGCAGAATGAATTCTCGTAACTACATAGCACAAGTAGATGTAGTTAACTTTAATCTCACATAG,29558,29674
|
|
Loading…
Reference in New Issue
Block a user