diff --git a/.DS_Store b/.DS_Store new file mode 100644 index 0000000..3d63f71 Binary files /dev/null and b/.DS_Store differ diff --git a/.ipynb_checkpoints/check_k3l_test-checkpoint.ipynb b/.ipynb_checkpoints/check_k3l_test-checkpoint.ipynb new file mode 100644 index 0000000..1b4d044 --- /dev/null +++ b/.ipynb_checkpoints/check_k3l_test-checkpoint.ipynb @@ -0,0 +1,1242 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 62, + "id": "fbb00f64-ecc8-412d-ae57-9a4036440f6a", + "metadata": {}, + "outputs": [], + "source": [ + "# check that k3l_test contains appropirate variants for k3l\n", + "import pandas as pd\n", + "from Bio.Seq import Seq" + ] + }, + { + "cell_type": "code", + "execution_count": 63, + "id": "e154ddf7-fe49-461b-9e1e-35142b170139", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + " | name | \n", + "sub_window_name | \n", + "wt | \n", + "position | \n", + "iupac | \n", + "codon_sub | \n", + "iupac_aa | \n", + "synonymous_codons | \n", + "no_stop_codons | \n", + "primer | \n", + "... | \n", + "sub_window | \n", + "forward_primer | \n", + "forward_primer_tm | \n", + "forward_primer_gc | \n", + "forward_primer_len | \n", + "reverse_primer_name | \n", + "reverse_primer | \n", + "reverse_primer_tm | \n", + "reverse_primer_gc | \n", + "reverse_primer_len | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "window_1-1_GCG11HCG | \n", + "window_1-1 | \n", + "GCG | \n", + "11 | \n", + "HCG | \n", + "GCG11HCG | \n", + "TPS | \n", + "0.0 | \n", + "0.0 | \n", + "TTTGTTATTCGTTGCCCAATHCGggwgaygtwatwaarGGCAGAGT... | \n", + "... | \n", + "HCGggwgaygtwatwaar | \n", + "GGCAGAGTATACGAGAAGGATT | \n", + "51.3 | \n", + "45.5 | \n", + "22 | \n", + "rev_window_1-1 | \n", + "ATTGGGCAACGAATAACAAAATGCA | \n", + "55.1 | \n", + "36.0 | \n", + "25 | \n", + "
1 | \n", + "window_1-1_GCG11GDG | \n", + "window_1-1 | \n", + "GCG | \n", + "11 | \n", + "GDG | \n", + "GCG11GDG | \n", + "EGV | \n", + "0.0 | \n", + "0.0 | \n", + "TTTGTTATTCGTTGCCCAATGDGggwgaygtwatwaarGGCAGAGT... | \n", + "... | \n", + "GDGggwgaygtwatwaar | \n", + "GGCAGAGTATACGAGAAGGATT | \n", + "51.3 | \n", + "45.5 | \n", + "22 | \n", + "rev_window_1-1 | \n", + "ATTGGGCAACGAATAACAAAATGCA | \n", + "55.1 | \n", + "36.0 | \n", + "25 | \n", + "
2 | \n", + "window_1-1_GGT12HGT | \n", + "window_1-1 | \n", + "GGT | \n", + "12 | \n", + "HGT | \n", + "GGT12HGT | \n", + "SRC | \n", + "0.0 | \n", + "0.0 | \n", + "TTTGTTATTCGTTGCCCAATgcwHGTgaygtwatwaarGGCAGAGT... | \n", + "... | \n", + "gcwHGTgaygtwatwaar | \n", + "GGCAGAGTATACGAGAAGGATT | \n", + "51.3 | \n", + "45.5 | \n", + "22 | \n", + "rev_window_1-1 | \n", + "ATTGGGCAACGAATAACAAAATGCA | \n", + "55.1 | \n", + "36.0 | \n", + "25 | \n", + "
3 | \n", + "window_1-1_GGT12GHT | \n", + "window_1-1 | \n", + "GGT | \n", + "12 | \n", + "GHT | \n", + "GGT12GHT | \n", + "DAV | \n", + "0.0 | \n", + "0.0 | \n", + "TTTGTTATTCGTTGCCCAATgcwGHTgaygtwatwaarGGCAGAGT... | \n", + "... | \n", + "gcwGHTgaygtwatwaar | \n", + "GGCAGAGTATACGAGAAGGATT | \n", + "51.3 | \n", + "45.5 | \n", + "22 | \n", + "rev_window_1-1 | \n", + "ATTGGGCAACGAATAACAAAATGCA | \n", + "55.1 | \n", + "36.0 | \n", + "25 | \n", + "
4 | \n", + "window_1-1_GAT13HAT | \n", + "window_1-1 | \n", + "GAT | \n", + "13 | \n", + "HAT | \n", + "GAT13HAT | \n", + "NHY | \n", + "0.0 | \n", + "0.0 | \n", + "TTTGTTATTCGTTGCCCAATgcwggwHATgtwatwaarGGCAGAGT... | \n", + "... | \n", + "gcwggwHATgtwatwaar | \n", + "GGCAGAGTATACGAGAAGGATT | \n", + "51.3 | \n", + "45.5 | \n", + "22 | \n", + "rev_window_1-1 | \n", + "ATTGGGCAACGAATAACAAAATGCA | \n", + "55.1 | \n", + "36.0 | \n", + "25 | \n", + "
5 rows × 21 columns
\n", + "\n", + " | position | \n", + "iupac_aa | \n", + "wt | \n", + "
---|---|---|---|
0 | \n", + "11 | \n", + "TPSEGV | \n", + "GCG | \n", + "
1 | \n", + "12 | \n", + "SRCDAV | \n", + "GGT | \n", + "
2 | \n", + "13 | \n", + "NHYAGV | \n", + "GAT | \n", + "
3 | \n", + "14 | \n", + "ILEAG | \n", + "GTA | \n", + "
4 | \n", + "15 | \n", + "VLKTR | \n", + "ATA | \n", + "
\n", + " | codon | \n", + "aa | \n", + "position | \n", + "missense_nuc | \n", + "missense_codons | \n", + "missense_aa | \n", + "missense_iupac | \n", + "missense_iupac_codon | \n", + "sele_codons | \n", + "sele_aa | \n", + "... | \n", + "syn_bool | \n", + "syn_codons | \n", + "syn_aa | \n", + "syn_iupac_codon | \n", + "no_stop_codons | \n", + "no_stop_aa | \n", + "no_stop_iupac_codon | \n", + "no_stop_syn_codons | \n", + "no_stop_syn_aa | \n", + "no_stop_syn_iupac_codon | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "AAA | \n", + "K | \n", + "0 | \n", + "CGT | \n", + "CAA GAA TAA | \n", + "*QE | \n", + "B | \n", + "BAA | \n", + "CAA GAA TAA | \n", + "QE* | \n", + "... | \n", + "False | \n", + "\n", + " | \n", + " | BAA | \n", + "CAA GAA | \n", + "QE | \n", + "SAA | \n", + "CAA GAA | \n", + "QE | \n", + "SAA | \n", + "
1 | \n", + "AAA | \n", + "K | \n", + "1 | \n", + "CGT | \n", + "ACA AGA ATA | \n", + "TRI | \n", + "B | \n", + "ABA | \n", + "ACA AGA ATA | \n", + "TRI | \n", + "... | \n", + "False | \n", + "\n", + " | \n", + " | ABA | \n", + "ACA AGA ATA | \n", + "TRI | \n", + "ABA | \n", + "ACA AGA ATA | \n", + "TRI | \n", + "ABA | \n", + "
2 | \n", + "AAA | \n", + "K | \n", + "2 | \n", + "CT | \n", + "AAC AAT | \n", + "N | \n", + "Y | \n", + "AAY | \n", + "AAT | \n", + "N | \n", + "... | \n", + "True | \n", + "AAG AAT | \n", + "KN | \n", + "AAK | \n", + "AAT | \n", + "N | \n", + "AAT | \n", + "AAG AAT | \n", + "KN | \n", + "AAK | \n", + "
3 | \n", + "AAC | \n", + "N | \n", + "0 | \n", + "CGT | \n", + "CAC GAC TAC | \n", + "HDY | \n", + "B | \n", + "BAC | \n", + "CAC GAC TAC | \n", + "HDY | \n", + "... | \n", + "False | \n", + "\n", + " | \n", + " | BAC | \n", + "CAC GAC TAC | \n", + "HDY | \n", + "BAC | \n", + "CAC GAC TAC | \n", + "HDY | \n", + "BAC | \n", + "
4 | \n", + "AAC | \n", + "N | \n", + "1 | \n", + "CGT | \n", + "ACC AGC ATC | \n", + "TSI | \n", + "B | \n", + "ABC | \n", + "ACC AGC ATC | \n", + "TSI | \n", + "... | \n", + "False | \n", + "\n", + " | \n", + " | ABC | \n", + "ACC AGC ATC | \n", + "TSI | \n", + "ABC | \n", + "ACC AGC ATC | \n", + "TSI | \n", + "ABC | \n", + "
5 rows × 21 columns
\n", + "\n", + " | position | \n", + "iupac | \n", + "wt | \n", + "
---|---|---|---|
0 | \n", + "11 | \n", + "[HCG, GDG] | \n", + "GCG | \n", + "
1 | \n", + "12 | \n", + "[HGT, GHT] | \n", + "GGT | \n", + "
2 | \n", + "13 | \n", + "[HAT, GBT, GAA] | \n", + "GAT | \n", + "
3 | \n", + "14 | \n", + "[WTA, GVA] | \n", + "GTA | \n", + "
4 | \n", + "15 | \n", + "[KTA, AVA, ATG] | \n", + "ATA | \n", + "
\n", - " |
---|
\n", + " | name | \n", + "sub_window_name | \n", + "wt | \n", + "position | \n", + "iupac | \n", + "codon_sub | \n", + "iupac_aa | \n", + "synonymous_codons | \n", + "no_stop_codons | \n", + "primer | \n", + "... | \n", + "sub_window | \n", + "forward_primer | \n", + "forward_primer_tm | \n", + "forward_primer_gc | \n", + "forward_primer_len | \n", + "reverse_primer_name | \n", + "reverse_primer | \n", + "reverse_primer_tm | \n", + "reverse_primer_gc | \n", + "reverse_primer_len | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
4 | \n", + "window_1-1_GAT13HAT | \n", + "window_1-1 | \n", + "GAT | \n", + "13 | \n", + "HAT | \n", + "GAT13HAT | \n", + "NHY | \n", + "0.0 | \n", + "0.0 | \n", + "TTTGTTATTCGTTGCCCAATgcwggwHATgtwatwaarGGCAGAGT... | \n", + "... | \n", + "gcwggwHATgtwatwaar | \n", + "GGCAGAGTATACGAGAAGGATT | \n", + "51.3 | \n", + "45.5 | \n", + "22 | \n", + "rev_window_1-1 | \n", + "ATTGGGCAACGAATAACAAAATGCA | \n", + "55.1 | \n", + "36.0 | \n", + "25 | \n", + "
5 | \n", + "window_1-1_GAT13GBT | \n", + "window_1-1 | \n", + "GAT | \n", + "13 | \n", + "GBT | \n", + "GAT13GBT | \n", + "AGV | \n", + "0.0 | \n", + "0.0 | \n", + "TTTGTTATTCGTTGCCCAATgcwggwGBTgtwatwaarGGCAGAGT... | \n", + "... | \n", + "gcwggwGBTgtwatwaar | \n", + "GGCAGAGTATACGAGAAGGATT | \n", + "51.3 | \n", + "45.5 | \n", + "22 | \n", + "rev_window_1-1 | \n", + "ATTGGGCAACGAATAACAAAATGCA | \n", + "55.1 | \n", + "36.0 | \n", + "25 | \n", + "
6 | \n", + "window_1-1_GAT13GAA | \n", + "window_1-1 | \n", + "GAT | \n", + "13 | \n", + "GAA | \n", + "GAT13GAA | \n", + "E | \n", + "0.0 | \n", + "0.0 | \n", + "TTTGTTATTCGTTGCCCAATgcwggwGAAgtwatwaarGGCAGAGT... | \n", + "... | \n", + "gcwggwGAAgtwatwaar | \n", + "GGCAGAGTATACGAGAAGGATT | \n", + "51.3 | \n", + "45.5 | \n", + "22 | \n", + "rev_window_1-1 | \n", + "ATTGGGCAACGAATAACAAAATGCA | \n", + "55.1 | \n", + "36.0 | \n", + "25 | \n", + "
3 rows × 21 columns
\n", + "\n", + " | position | \n", + "iupac_aa | \n", + "wt_codon | \n", + "wt_aa | \n", + "wt_missense | \n", + "diff_1 | \n", + "diff_2 | \n", + "sym_diff | \n", + "
---|---|---|---|---|---|---|---|---|
0 | \n", + "11 | \n", + "{S, G, P, V, E, T} | \n", + "GCG | \n", + "A | \n", + "{G, S, P, V, E, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
1 | \n", + "12 | \n", + "{S, C, D, R, V, A} | \n", + "GGT | \n", + "G | \n", + "{S, C, D, R, V, A} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
2 | \n", + "13 | \n", + "{G, N, V, A, E, Y, H} | \n", + "GAT | \n", + "D | \n", + "{G, N, V, A, E, Y, H} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
3 | \n", + "14 | \n", + "{G, I, L, A, E} | \n", + "GTA | \n", + "V | \n", + "{G, I, L, A, E} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
4 | \n", + "15 | \n", + "{K, V, R, L, M, T} | \n", + "ATA | \n", + "I | \n", + "{K, V, R, L, M, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
5 | \n", + "16 | \n", + "{Q, N, K, R, *, E, M, T} | \n", + "AAG | \n", + "K | \n", + "{Q, N, R, *, E, M, T} | \n", + "{} | \n", + "{K} | \n", + "{K} | \n", + "
6 | \n", + "17 | \n", + "{S, C, D, R, V, A} | \n", + "GGC | \n", + "G | \n", + "{S, C, D, R, V, A} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
7 | \n", + "18 | \n", + "{G, S, I, K, *, T} | \n", + "AGA | \n", + "R | \n", + "{G, S, I, K, *, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
8 | \n", + "43 | \n", + "{G, I, N, C, R, T} | \n", + "AGT | \n", + "S | \n", + "{G, I, N, C, R, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
9 | \n", + "44 | \n", + "{G, I, D, L, A, F} | \n", + "GTT | \n", + "V | \n", + "{G, I, D, L, A, F} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
10 | \n", + "45 | \n", + "{Q, N, R, *, E, M, T} | \n", + "AAG | \n", + "K | \n", + "{Q, N, R, *, E, M, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
11 | \n", + "46 | \n", + "{I, K, V, R, L, T} | \n", + "ATG | \n", + "M | \n", + "{I, K, V, R, L, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
12 | \n", + "47 | \n", + "{Q, N, P, D, R, L, Y} | \n", + "CAT | \n", + "H | \n", + "{Q, N, P, D, R, L, Y} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
13 | \n", + "48 | \n", + "{I, K, V, R, L, T} | \n", + "ATG | \n", + "M | \n", + "{I, K, V, R, L, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
14 | \n", + "49 | \n", + "{G, N, V, A, E, Y, H} | \n", + "GAT | \n", + "D | \n", + "{G, N, V, A, E, Y, H} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
15 | \n", + "50 | \n", + "{G, S, I, K, *, T} | \n", + "AGA | \n", + "R | \n", + "{G, S, I, K, *, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
16 | \n", + "51 | \n", + "{S, N, C, D, *, F, H} | \n", + "TAT | \n", + "Y | \n", + "{S, N, C, D, *, F, H} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
17 | \n", + "71 | \n", + "{G, N, V, A, E, Y, H} | \n", + "GAT | \n", + "D | \n", + "{G, N, V, A, E, Y, H} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
18 | \n", + "72 | \n", + "{S, N, C, D, F, H} | \n", + "TAT | \n", + "Y | \n", + "{S, N, C, D, *, F, H} | \n", + "{*} | \n", + "{} | \n", + "{*} | \n", + "
19 | \n", + "73 | \n", + "{S, I, K, P, R, A} | \n", + "ACA | \n", + "T | \n", + "{S, I, K, P, R, A} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
20 | \n", + "74 | \n", + "{Q, I, N, R, *, E, T} | \n", + "AAA | \n", + "K | \n", + "{Q, I, N, R, *, E, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
21 | \n", + "75 | \n", + "{G, V, R, *, A, E} | \n", + "GGA | \n", + "G | \n", + "{V, R, *, A, E} | \n", + "{} | \n", + "{G} | \n", + "{G} | \n", + "
22 | \n", + "76 | \n", + "{S, N, C, D, *, F, H} | \n", + "TAT | \n", + "Y | \n", + "{S, N, C, D, *, F, H} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
23 | \n", + "77 | \n", + "{K, V, R, L, M, T} | \n", + "ATA | \n", + "I | \n", + "{K, V, R, L, M, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
24 | \n", + "78 | \n", + "{G, N, V, A, E, Y, H} | \n", + "GAT | \n", + "D | \n", + "{G, N, V, A, E, Y, H} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
25 | \n", + "79 | \n", + "{G, I, D, L, A, F} | \n", + "GTC | \n", + "V | \n", + "{G, I, D, L, A, F} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
26 | \n", + "80 | \n", + "{S, I, K, D, T, Y, H} | \n", + "AAT | \n", + "N | \n", + "{S, I, K, D, T, Y, H} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
27 | \n", + "81 | \n", + "{S, N, C, D, *, F, H} | \n", + "TAC | \n", + "Y | \n", + "{S, N, C, D, *, F, H} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
28 | \n", + "82 | \n", + "{Q, I, N, R, *, E, T} | \n", + "AAA | \n", + "K | \n", + "{Q, I, N, R, *, E, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
29 | \n", + "83 | \n", + "{G, W, S, K, R, M, T} | \n", + "AGG | \n", + "R | \n", + "{G, W, S, K, M, T} | \n", + "{} | \n", + "{R} | \n", + "{R} | \n", + "
30 | \n", + "84 | \n", + "{I, K, V, R, L, T} | \n", + "ATG | \n", + "M | \n", + "{I, K, V, R, L, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
31 | \n", + "85 | \n", + "{G, S, W, R, *, F, Y} | \n", + "TGT | \n", + "C | \n", + "{S, G, W, R, *, F, Y} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
32 | \n", + "86 | \n", + "{G, S, I, K, *, T} | \n", + "AGA | \n", + "R | \n", + "{G, S, I, K, *, T} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
33 | \n", + "87 | \n", + "{Q, N, P, D, R, L, Y} | \n", + "CAT | \n", + "H | \n", + "{Q, N, P, D, R, L, Y} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
34 | \n", + "88 | \n", + "{K, P, R, *, L, E, H} | \n", + "CAA | \n", + "Q | \n", + "{K, P, R, *, L, E, H} | \n", + "{} | \n", + "{} | \n", + "{} | \n", + "
\n", + " | position | \n", + "iupac_aa | \n", + "wt_codon | \n", + "wt_aa | \n", + "wt_missense | \n", + "difference | \n", + "difference_2 | \n", + "contains_wt_aa | \n", + "
---|---|---|---|---|---|---|---|---|
0 | \n", + "11 | \n", + "[, T, P, S, E, G, V, ] | \n", + "GCG | \n", + "A | \n", + "[T, P, S, E, G, V] | \n", + "{A} | \n", + "{, S, G, P, V, E, T} | \n", + "True | \n", + "
1 | \n", + "12 | \n", + "[, S, R, C, D, A, V, ] | \n", + "GGT | \n", + "G | \n", + "[S, R, C, D, A, V] | \n", + "{G} | \n", + "{, S, C, D, R, V, A} | \n", + "True | \n", + "
2 | \n", + "13 | \n", + "[, N, H, Y, A, G, V, ] | \n", + "GAT | \n", + "D | \n", + "[N, H, Y, A, G, V, E, E] | \n", + "{D} | \n", + "{, G, N, V, A, Y, H} | \n", + "True | \n", + "
3 | \n", + "14 | \n", + "[, I, L, E, A, G, ] | \n", + "GTA | \n", + "V | \n", + "[I, L, L, E, A, G] | \n", + "{V} | \n", + "{, G, I, L, A, E} | \n", + "True | \n", + "
4 | \n", + "15 | \n", + "[, V, L, K, T, R, ] | \n", + "ATA | \n", + "I | \n", + "[L, V, L, K, T, R, M] | \n", + "{I} | \n", + "{, K, V, R, L, T} | \n", + "True | \n", + "
5 | \n", + "16 | \n", + "[, Q, E, *, T, R, M, K, N, ] | \n", + "AAG | \n", + "K | \n", + "[Q, E, *, T, R, M, N, N] | \n", + "{} | \n", + "{, Q, N, R, *, E, M, T} | \n", + "False | \n", + "
6 | \n", + "17 | \n", + "[, S, R, C, D, A, V, ] | \n", + "GGC | \n", + "G | \n", + "[S, R, C, D, A, V] | \n", + "{G} | \n", + "{, S, C, D, R, V, A} | \n", + "True | \n", + "
7 | \n", + "18 | \n", + "[, G, *, K, T, I, ] | \n", + "AGA | \n", + "R | \n", + "[G, *, K, T, I, S, S] | \n", + "{R} | \n", + "{, G, I, K, *, T} | \n", + "True | \n", + "
8 | \n", + "43 | \n", + "[, G, C, N, T, I, ] | \n", + "AGT | \n", + "S | \n", + "[R, G, C, N, T, I, R, R] | \n", + "{S} | \n", + "{, G, I, N, C, T} | \n", + "True | \n", + "
9 | \n", + "44 | \n", + "[, I, L, F, D, A, G, ] | \n", + "GTT | \n", + "V | \n", + "[I, L, F, D, A, G] | \n", + "{V} | \n", + "{, G, I, D, L, A, F} | \n", + "True | \n", + "
10 | \n", + "45 | \n", + "[, Q, E, *, T, R, M, ] | \n", + "AAG | \n", + "K | \n", + "[Q, E, *, T, R, M, N, N] | \n", + "{K} | \n", + "{, Q, R, *, E, M, T} | \n", + "True | \n", + "
11 | \n", + "46 | \n", + "[, V, L, K, T, R, ] | \n", + "ATG | \n", + "M | \n", + "[L, V, L, K, T, R, I, I, I] | \n", + "{M} | \n", + "{, K, V, R, L, T} | \n", + "True | \n", + "
12 | \n", + "47 | \n", + "[, N, D, Y, P, R, L, ] | \n", + "CAT | \n", + "H | \n", + "[N, D, Y, P, R, L, Q, Q] | \n", + "{H} | \n", + "{, N, P, D, R, L, Y} | \n", + "True | \n", + "
13 | \n", + "48 | \n", + "[, V, L, K, T, R, ] | \n", + "ATG | \n", + "M | \n", + "[L, V, L, K, T, R, I, I, I] | \n", + "{M} | \n", + "{, K, V, R, L, T} | \n", + "True | \n", + "
14 | \n", + "49 | \n", + "[, N, H, Y, A, G, V, ] | \n", + "GAT | \n", + "D | \n", + "[N, H, Y, A, G, V, E, E] | \n", + "{D} | \n", + "{, G, N, V, A, Y, H} | \n", + "True | \n", + "
15 | \n", + "50 | \n", + "[, G, *, K, T, I, ] | \n", + "AGA | \n", + "R | \n", + "[G, *, K, T, I, S, S] | \n", + "{R} | \n", + "{, G, I, K, *, T} | \n", + "True | \n", + "
16 | \n", + "51 | \n", + "[, N, H, D, S, C, F, ] | \n", + "TAT | \n", + "Y | \n", + "[N, H, D, S, C, F, *, *] | \n", + "{Y} | \n", + "{, S, N, C, D, F, H} | \n", + "True | \n", + "
17 | \n", + "71 | \n", + "[, N, H, Y, A, G, V, ] | \n", + "GAT | \n", + "D | \n", + "[N, H, Y, A, G, V, E, E] | \n", + "{D} | \n", + "{, G, N, V, A, Y, H} | \n", + "True | \n", + "
18 | \n", + "72 | \n", + "[, N, H, D, S, C, F, ] | \n", + "TAT | \n", + "Y | \n", + "[N, H, D, S, C, F, *, *] | \n", + "{Y} | \n", + "{, S, N, C, D, F, H} | \n", + "True | \n", + "
19 | \n", + "73 | \n", + "[, P, A, S, K, R, I, ] | \n", + "ACA | \n", + "T | \n", + "[P, A, S, K, R, I] | \n", + "{T} | \n", + "{, S, I, K, P, R, A} | \n", + "True | \n", + "
20 | \n", + "74 | \n", + "[, Q, E, *, T, R, I, ] | \n", + "AAA | \n", + "K | \n", + "[Q, E, *, T, R, I, N, N] | \n", + "{K} | \n", + "{, Q, I, R, *, E, T} | \n", + "True | \n", + "
21 | \n", + "75 | \n", + "[, R, *, E, A, V, ] | \n", + "GGA | \n", + "G | \n", + "[R, R, *, E, A, V] | \n", + "{G} | \n", + "{, V, R, *, A, E} | \n", + "True | \n", + "
22 | \n", + "76 | \n", + "[, N, H, D, S, C, F, ] | \n", + "TAT | \n", + "Y | \n", + "[N, H, D, S, C, F, *, *] | \n", + "{Y} | \n", + "{, S, N, C, D, F, H} | \n", + "True | \n", + "
23 | \n", + "77 | \n", + "[, V, L, K, T, R, ] | \n", + "ATA | \n", + "I | \n", + "[L, V, L, K, T, R, M] | \n", + "{I} | \n", + "{, K, V, R, L, T} | \n", + "True | \n", + "
24 | \n", + "78 | \n", + "[, N, H, Y, A, G, V, ] | \n", + "GAT | \n", + "D | \n", + "[N, H, Y, A, G, V, E, E] | \n", + "{D} | \n", + "{, G, N, V, A, Y, H} | \n", + "True | \n", + "
25 | \n", + "79 | \n", + "[, I, L, F, D, A, G, ] | \n", + "GTC | \n", + "V | \n", + "[I, L, F, D, A, G] | \n", + "{V} | \n", + "{, G, I, D, L, A, F} | \n", + "True | \n", + "
26 | \n", + "80 | \n", + "[, H, D, Y, T, S, I, ] | \n", + "AAT | \n", + "N | \n", + "[H, D, Y, T, S, I, K, K] | \n", + "{N} | \n", + "{, S, I, D, T, Y, H} | \n", + "True | \n", + "
27 | \n", + "81 | \n", + "[, N, H, D, S, C, F, ] | \n", + "TAC | \n", + "Y | \n", + "[N, H, D, S, C, F, *, *] | \n", + "{Y} | \n", + "{, S, N, C, D, F, H} | \n", + "True | \n", + "
28 | \n", + "82 | \n", + "[, Q, E, *, T, R, I, ] | \n", + "AAA | \n", + "K | \n", + "[Q, E, *, T, R, I, N, N] | \n", + "{K} | \n", + "{, Q, I, R, *, E, T} | \n", + "True | \n", + "
29 | \n", + "83 | \n", + "[, G, W, K, T, M, R, S, ] | \n", + "AGG | \n", + "R | \n", + "[G, W, K, T, M, S, S] | \n", + "{} | \n", + "{, G, W, S, K, M, T} | \n", + "False | \n", + "
30 | \n", + "84 | \n", + "[, V, L, K, T, R, ] | \n", + "ATG | \n", + "M | \n", + "[L, V, L, K, T, R, I, I, I] | \n", + "{M} | \n", + "{, K, V, R, L, T} | \n", + "True | \n", + "
31 | \n", + "85 | \n", + "[, R, G, Y, S, F, *, W, ] | \n", + "TGT | \n", + "C | \n", + "[S, R, G, Y, S, F, *, W] | \n", + "{C} | \n", + "{, G, S, W, R, *, F, Y} | \n", + "True | \n", + "
32 | \n", + "86 | \n", + "[, G, *, K, T, I, ] | \n", + "AGA | \n", + "R | \n", + "[G, *, K, T, I, S, S] | \n", + "{R} | \n", + "{, G, I, K, *, T} | \n", + "True | \n", + "
33 | \n", + "87 | \n", + "[, N, D, Y, P, R, L, ] | \n", + "CAT | \n", + "H | \n", + "[N, D, Y, P, R, L, Q, Q] | \n", + "{H} | \n", + "{, N, P, D, R, L, Y} | \n", + "True | \n", + "
34 | \n", + "88 | \n", + "[, K, E, *, P, R, L, ] | \n", + "CAA | \n", + "Q | \n", + "[K, E, *, P, R, L, H, H] | \n", + "{Q} | \n", + "{, K, P, R, *, L, E} | \n", + "True | \n", + "
\n", + " | codon | \n", + "aa | \n", + "position | \n", + "missense_nuc | \n", + "missense_codons | \n", + "missense_aa | \n", + "missense_iupac | \n", + "missense_iupac_codon | \n", + "sele_codons | \n", + "sele_aa | \n", + "... | \n", + "syn_bool | \n", + "syn_codons | \n", + "syn_aa | \n", + "syn_iupac_codon | \n", + "no_stop_codons | \n", + "no_stop_aa | \n", + "no_stop_iupac_codon | \n", + "no_stop_syn_codons | \n", + "no_stop_syn_aa | \n", + "no_stop_syn_iupac_codon | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "AAA | \n", + "K | \n", + "0 | \n", + "CGT | \n", + "CAA GAA TAA | \n", + "*QE | \n", + "B | \n", + "BAA | \n", + "CAA GAA TAA | \n", + "QE* | \n", + "... | \n", + "False | \n", + "\n", + " | \n", + " | BAA | \n", + "CAA GAA | \n", + "QE | \n", + "SAA | \n", + "CAA GAA | \n", + "QE | \n", + "SAA | \n", + "
1 | \n", + "AAA | \n", + "K | \n", + "1 | \n", + "CGT | \n", + "ACA AGA ATA | \n", + "TRI | \n", + "B | \n", + "ABA | \n", + "ACA AGA ATA | \n", + "TRI | \n", + "... | \n", + "False | \n", + "\n", + " | \n", + " | ABA | \n", + "ACA AGA ATA | \n", + "TRI | \n", + "ABA | \n", + "ACA AGA ATA | \n", + "TRI | \n", + "ABA | \n", + "
2 | \n", + "AAA | \n", + "K | \n", + "2 | \n", + "CT | \n", + "AAC AAT | \n", + "N | \n", + "Y | \n", + "AAY | \n", + "AAT | \n", + "N | \n", + "... | \n", + "True | \n", + "AAG AAT | \n", + "KN | \n", + "AAK | \n", + "AAT | \n", + "N | \n", + "AAT | \n", + "AAG AAT | \n", + "KN | \n", + "AAK | \n", + "
3 | \n", + "AAC | \n", + "N | \n", + "0 | \n", + "CGT | \n", + "CAC GAC TAC | \n", + "HDY | \n", + "B | \n", + "BAC | \n", + "CAC GAC TAC | \n", + "HDY | \n", + "... | \n", + "False | \n", + "\n", + " | \n", + " | BAC | \n", + "CAC GAC TAC | \n", + "HDY | \n", + "BAC | \n", + "CAC GAC TAC | \n", + "HDY | \n", + "BAC | \n", + "
4 | \n", + "AAC | \n", + "N | \n", + "1 | \n", + "CGT | \n", + "ACC AGC ATC | \n", + "TSI | \n", + "B | \n", + "ABC | \n", + "ACC AGC ATC | \n", + "TSI | \n", + "... | \n", + "False | \n", + "\n", + " | \n", + " | ABC | \n", + "ACC AGC ATC | \n", + "TSI | \n", + "ABC | \n", + "ACC AGC ATC | \n", + "TSI | \n", + "ABC | \n", + "
5 rows × 21 columns
\n", + "\n", + " | position | \n", + "iupac | \n", + "wt | \n", + "
---|---|---|---|
0 | \n", + "11 | \n", + "[HCG, GDG] | \n", + "GCG | \n", + "
1 | \n", + "12 | \n", + "[HGT, GHT] | \n", + "GGT | \n", + "
2 | \n", + "13 | \n", + "[HAT, GBT, GAA] | \n", + "GAT | \n", + "
3 | \n", + "14 | \n", + "[WTA, GVA] | \n", + "GTA | \n", + "
4 | \n", + "15 | \n", + "[KTA, AVA, ATG] | \n", + "ATA | \n", + "
\n", - " | homology_arm | \n", - "reverse_primer | \n", - "reverse_primer_name | \n", - "forward_primer | \n", - "synonymous_included | \n", - "name | \n", - "codon_sub | \n", - "wt | \n", - "pos | \n", - "iupac | \n", - "
---|---|---|---|---|---|---|---|---|---|---|
0 | \n", - "TTTGTTATTCGTTGCCCAAT | \n", - "ATTGGGCAACGAATAACAAAATGCA | \n", - "rev_window_1-1 | \n", - "GGCAGAGTATACGAGAAGGATT | \n", - "0.0 | \n", - "window_1-1_GCG11HCG | \n", - "GCG11HCG | \n", - "GCG | \n", - "11.0 | \n", - "HCG | \n", - "
1 | \n", - "TTTGTTATTCGTTGCCCAAT | \n", - "ATTGGGCAACGAATAACAAAATGCA | \n", - "rev_window_1-1 | \n", - "GGCAGAGTATACGAGAAGGATT | \n", - "0.0 | \n", - "window_1-1_GCG11GDG | \n", - "GCG11GDG | \n", - "GCG | \n", - "11.0 | \n", - "GDG | \n", - "
2 | \n", - "TTTGTTATTCGTTGCCCAAT | \n", - "ATTGGGCAACGAATAACAAAATGCA | \n", - "rev_window_1-1 | \n", - "GGCAGAGTATACGAGAAGGATT | \n", - "0.0 | \n", - "window_1-1_GGT12HGT | \n", - "GGT12HGT | \n", - "GGT | \n", - "12.0 | \n", - "HGT | \n", - "
3 | \n", - "TTTGTTATTCGTTGCCCAAT | \n", - "ATTGGGCAACGAATAACAAAATGCA | \n", - "rev_window_1-1 | \n", - "GGCAGAGTATACGAGAAGGATT | \n", - "0.0 | \n", - "window_1-1_GGT12GHT | \n", - "GGT12GHT | \n", - "GGT | \n", - "12.0 | \n", - "GHT | \n", - "
4 | \n", - "TTTGTTATTCGTTGCCCAAT | \n", - "ATTGGGCAACGAATAACAAAATGCA | \n", - "rev_window_1-1 | \n", - "GGCAGAGTATACGAGAAGGATT | \n", - "0.0 | \n", - "window_1-1_GAT13HAT | \n", - "GAT13HAT | \n", - "GAT | \n", - "13.0 | \n", - "HAT | \n", - "
... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "... | \n", - "
92 | \n", - "TCAATTACAAAAGGATGTGT | \n", - "ACACATCCTTTTGTAATTGACATCTATATATCCT | \n", - "rev_window_3-4 | \n", - "TAGTAGCTGTCGAGTCGC | \n", - "0.0 | \n", - "window_3-4_CAT87CBT | \n", - "CAT87CBT | \n", - "CAT | \n", - "87.0 | \n", - "CBT | \n", - "
93 | \n", - "TCAATTACAAAAGGATGTGT | \n", - "ACACATCCTTTTGTAATTGACATCTATATATCCT | \n", - "rev_window_3-4 | \n", - "TAGTAGCTGTCGAGTCGC | \n", - "0.0 | \n", - "window_3-4_CAT87CAA | \n", - "CAT87CAA | \n", - "CAT | \n", - "87.0 | \n", - "CAA | \n", - "
94 | \n", - "TCAATTACAAAAGGATGTGT | \n", - "ACACATCCTTTTGTAATTGACATCTATATATCCT | \n", - "rev_window_3-4 | \n", - "TAGTAGCTGTCGAGTCGC | \n", - "0.0 | \n", - "window_3-4_CAA88DAA | \n", - "CAA88DAA | \n", - "CAA | \n", - "88.0 | \n", - "DAA | \n", - "
95 | \n", - "TCAATTACAAAAGGATGTGT | \n", - "ACACATCCTTTTGTAATTGACATCTATATATCCT | \n", - "rev_window_3-4 | \n", - "TAGTAGCTGTCGAGTCGC | \n", - "0.0 | \n", - "window_3-4_CAA88CBA | \n", - "CAA88CBA | \n", - "CAA | \n", - "88.0 | \n", - "CBA | \n", - "
96 | \n", - "TCAATTACAAAAGGATGTGT | \n", - "ACACATCCTTTTGTAATTGACATCTATATATCCT | \n", - "rev_window_3-4 | \n", - "TAGTAGCTGTCGAGTCGC | \n", - "0.0 | \n", - "window_3-4_CAA88CAT | \n", - "CAA88CAT | \n", - "CAA | \n", - "88.0 | \n", - "CAT | \n", - "
97 rows × 10 columns
\n", - "