from Bio import SeqIO from nsbdiagnosistoolkit.engine.data.MLST import Allele, MLSTProfile from nsbdiagnosistoolkit.engine.remote.databases.institutpasteur.profiling import InstitutPasteurProfiler async def test_profiling_results_in_exact_matches_when_exact(): sequence = str(SeqIO.read("tests/resources/tohama_I_bpertussis.fasta", "fasta").seq) async with InstitutPasteurProfiler(database_name="pubmlst_bordetella_seqdef") as dummy_profiler: exact_matches = dummy_profiler.fetch_mlst_allele_variants(sequence_string=sequence) targets_left = {"adk", "fumC", "glyA", "tyrB", "icd", "pepA", "pgm"} async for exact_match in exact_matches: assert isinstance(exact_match, Allele) assert exact_match.allele_variant == '1' # All of Tohama I has allele id I targets_left.remove(exact_match.allele_loci) assert len(targets_left) == 0 async def test_profiling_results_in_correct_st(): sequence = str(SeqIO.read("tests/resources/tohama_I_bpertussis.fasta", "fasta").seq) dummy_alleles = [ Allele("adk", "1"), Allele("fumC", "1"), Allele("glyA", "1"), Allele("tyrB", "1"), Allele("icd", "1"), Allele("pepA", "1"), Allele("pgm", "1"), ] async with InstitutPasteurProfiler(database_name="pubmlst_bordetella_seqdef") as dummy_profiler: exact_matches = dummy_profiler.fetch_mlst_allele_variants(sequence_string=sequence) mlst_st_data = await dummy_profiler.fetch_mlst_st(dummy_alleles) assert mlst_st_data is not None assert isinstance(mlst_st_data, MLSTProfile) assert mlst_st_data.clonal_complex == "ST-2 complex" assert mlst_st_data.sequence_type == "1"